From f8f67a788e4c8dc41b59d6f22631172fb4a431df Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Thu, 25 Jun 2020 19:55:45 +0300 Subject: [PATCH 001/341] allow to turn on fsync on inserts and merges --- src/Disks/DiskLocal.cpp | 17 +++++++- src/Disks/DiskLocal.h | 2 + src/Disks/DiskMemory.cpp | 5 +++ src/Disks/DiskMemory.h | 2 + src/Disks/IDisk.h | 3 ++ src/Disks/S3/DiskS3.cpp | 5 +++ src/Disks/S3/DiskS3.h | 2 + .../MergeTree/IMergeTreeDataPartWriter.cpp | 11 +++-- .../MergeTree/IMergeTreeDataPartWriter.h | 6 +-- .../MergeTree/MergeTreeDataMergerMutator.cpp | 41 +++++++++++++------ .../MergeTree/MergeTreeDataMergerMutator.h | 6 ++- .../MergeTreeDataPartWriterCompact.cpp | 4 +- .../MergeTreeDataPartWriterCompact.h | 2 +- .../MergeTree/MergeTreeDataPartWriterWide.cpp | 4 +- .../MergeTree/MergeTreeDataPartWriterWide.h | 2 +- .../MergeTree/MergeTreeDataWriter.cpp | 7 +++- src/Storages/MergeTree/MergeTreeSettings.h | 3 ++ .../MergeTree/MergedBlockOutputStream.cpp | 7 ++-- .../MergeTree/MergedBlockOutputStream.h | 1 + .../MergedColumnOnlyOutputStream.cpp | 9 ++-- .../MergeTree/MergedColumnOnlyOutputStream.h | 2 +- 21 files changed, 108 insertions(+), 33 deletions(-) diff --git a/src/Disks/DiskLocal.cpp b/src/Disks/DiskLocal.cpp index 68f5ee99a7a..c67bac7ffe2 100644 --- a/src/Disks/DiskLocal.cpp +++ b/src/Disks/DiskLocal.cpp @@ -8,7 +8,7 @@ #include #include - +#include namespace DB { @@ -19,6 +19,9 @@ namespace ErrorCodes extern const int EXCESSIVE_ELEMENT_IN_CONFIG; extern const int PATH_ACCESS_DENIED; extern const int INCORRECT_DISK_INDEX; + extern const int FILE_DOESNT_EXIST; + extern const int CANNOT_OPEN_FILE; + extern const int CANNOT_FSYNC; } std::mutex DiskLocal::reservation_mutex; @@ -188,6 +191,18 @@ void DiskLocal::moveDirectory(const String & from_path, const String & to_path) Poco::File(disk_path + from_path).renameTo(disk_path + to_path); } +void DiskLocal::sync(const String & path) const +{ + String full_path = disk_path + path; + int fd = ::open(full_path.c_str(), O_RDONLY); + if (-1 == fd) + throwFromErrnoWithPath("Cannot open file " + full_path, full_path, + errno == ENOENT ? 
ErrorCodes::FILE_DOESNT_EXIST : ErrorCodes::CANNOT_OPEN_FILE); + + if (-1 == fsync(fd)) + throwFromErrnoWithPath("Cannot fsync " + full_path, full_path, ErrorCodes::CANNOT_FSYNC); +} + DiskDirectoryIteratorPtr DiskLocal::iterateDirectory(const String & path) { return std::make_unique(disk_path, path); diff --git a/src/Disks/DiskLocal.h b/src/Disks/DiskLocal.h index 61a3994b655..743ba2ceb10 100644 --- a/src/Disks/DiskLocal.h +++ b/src/Disks/DiskLocal.h @@ -59,6 +59,8 @@ public: void moveDirectory(const String & from_path, const String & to_path) override; + void sync(const String & path) const override; + DiskDirectoryIteratorPtr iterateDirectory(const String & path) override; void createFile(const String & path) override; diff --git a/src/Disks/DiskMemory.cpp b/src/Disks/DiskMemory.cpp index 3e43d159ba5..5b3350e40f7 100644 --- a/src/Disks/DiskMemory.cpp +++ b/src/Disks/DiskMemory.cpp @@ -261,6 +261,11 @@ void DiskMemory::moveDirectory(const String & /*from_path*/, const String & /*to throw Exception("Method moveDirectory is not implemented for memory disks", ErrorCodes::NOT_IMPLEMENTED); } +void DiskMemory::sync(const String & /*path*/) const +{ + throw Exception("Method sync is not implemented for memory disks", ErrorCodes::NOT_IMPLEMENTED); +} + DiskDirectoryIteratorPtr DiskMemory::iterateDirectory(const String & path) { std::lock_guard lock(mutex); diff --git a/src/Disks/DiskMemory.h b/src/Disks/DiskMemory.h index b0c1d30c61d..8a3ddf05aa7 100644 --- a/src/Disks/DiskMemory.h +++ b/src/Disks/DiskMemory.h @@ -52,6 +52,8 @@ public: void moveDirectory(const String & from_path, const String & to_path) override; + void sync(const String & path) const override; + DiskDirectoryIteratorPtr iterateDirectory(const String & path) override; void createFile(const String & path) override; diff --git a/src/Disks/IDisk.h b/src/Disks/IDisk.h index 011c75402f4..8de77a560d1 100644 --- a/src/Disks/IDisk.h +++ b/src/Disks/IDisk.h @@ -105,6 +105,9 @@ public: /// Move directory from `from_path` to `to_path`. virtual void moveDirectory(const String & from_path, const String & to_path) = 0; + /// Do fsync on directory. + virtual void sync(const String & path) const = 0; + /// Return iterator to the contents of the specified directory. 
virtual DiskDirectoryIteratorPtr iterateDirectory(const String & path) = 0; diff --git a/src/Disks/S3/DiskS3.cpp b/src/Disks/S3/DiskS3.cpp index 71b5991f770..292f6567df4 100644 --- a/src/Disks/S3/DiskS3.cpp +++ b/src/Disks/S3/DiskS3.cpp @@ -466,6 +466,11 @@ void DiskS3::clearDirectory(const String & path) remove(it->path()); } +void DiskS3::sync(const String & /*path*/) const +{ + throw Exception("Method sync is not implemented for S3 disks", ErrorCodes::NOT_IMPLEMENTED); +} + void DiskS3::moveFile(const String & from_path, const String & to_path) { if (exists(to_path)) diff --git a/src/Disks/S3/DiskS3.h b/src/Disks/S3/DiskS3.h index 5fa8e8358a6..09132367ae8 100644 --- a/src/Disks/S3/DiskS3.h +++ b/src/Disks/S3/DiskS3.h @@ -58,6 +58,8 @@ public: void moveDirectory(const String & from_path, const String & to_path) override { moveFile(from_path, to_path); } + void sync(const String & path) const override; + DiskDirectoryIteratorPtr iterateDirectory(const String & path) override; void moveFile(const String & from_path, const String & to_path) override; diff --git a/src/Storages/MergeTree/IMergeTreeDataPartWriter.cpp b/src/Storages/MergeTree/IMergeTreeDataPartWriter.cpp index 73ac7fc0064..03ae2166504 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPartWriter.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPartWriter.cpp @@ -308,7 +308,8 @@ void IMergeTreeDataPartWriter::calculateAndSerializeSkipIndices( skip_index_data_mark = skip_index_current_data_mark; } -void IMergeTreeDataPartWriter::finishPrimaryIndexSerialization(MergeTreeData::DataPart::Checksums & checksums) +void IMergeTreeDataPartWriter::finishPrimaryIndexSerialization( + MergeTreeData::DataPart::Checksums & checksums, bool sync) { bool write_final_mark = (with_final_mark && data_written); if (write_final_mark && compute_granularity) @@ -330,12 +331,14 @@ void IMergeTreeDataPartWriter::finishPrimaryIndexSerialization(MergeTreeData::Da index_stream->next(); checksums.files["primary.idx"].file_size = index_stream->count(); checksums.files["primary.idx"].file_hash = index_stream->getHash(); - index_stream = nullptr; + if (sync) + index_stream->sync(); + index_stream.reset(); } } void IMergeTreeDataPartWriter::finishSkipIndicesSerialization( - MergeTreeData::DataPart::Checksums & checksums) + MergeTreeData::DataPart::Checksums & checksums, bool sync) { for (size_t i = 0; i < skip_indices.size(); ++i) { @@ -348,6 +351,8 @@ void IMergeTreeDataPartWriter::finishSkipIndicesSerialization( { stream->finalize(); stream->addToChecksums(checksums); + if (sync) + stream->sync(); } skip_indices_streams.clear(); diff --git a/src/Storages/MergeTree/IMergeTreeDataPartWriter.h b/src/Storages/MergeTree/IMergeTreeDataPartWriter.h index 2f849e7c895..eebdb880a66 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPartWriter.h +++ b/src/Storages/MergeTree/IMergeTreeDataPartWriter.h @@ -102,9 +102,9 @@ public: void initSkipIndices(); void initPrimaryIndex(); - virtual void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums) = 0; - void finishPrimaryIndexSerialization(MergeTreeData::DataPart::Checksums & checksums); - void finishSkipIndicesSerialization(MergeTreeData::DataPart::Checksums & checksums); + virtual void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool sync) = 0; + void finishPrimaryIndexSerialization(MergeTreeData::DataPart::Checksums & checksums, bool sync); + void finishSkipIndicesSerialization(MergeTreeData::DataPart::Checksums & checksum, bool sync); protected: /// Count index_granularity for block and 
store in `index_granularity` diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp index 00830dd78c2..ccd7f234925 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp +++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp @@ -576,6 +576,13 @@ public: } }; +static bool needSyncPart(const size_t input_rows, size_t input_bytes, const MergeTreeSettings & settings) +{ + return ((settings.min_rows_to_sync_after_merge && input_rows >= settings.min_rows_to_sync_after_merge) + || (settings.min_compressed_bytes_to_sync_after_merge && input_bytes >= settings.min_compressed_bytes_to_sync_after_merge)); +} + + /// parts should be sorted. MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTemporaryPart( const FutureMergedMutatedPart & future_part, @@ -648,6 +655,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor } size_t sum_input_rows_upper_bound = merge_entry->total_rows_count; + size_t sum_compressed_bytes_upper_bound = merge_entry->total_size_bytes_compressed; MergeAlgorithm merge_alg = chooseMergeAlgorithm(parts, sum_input_rows_upper_bound, gathering_columns, deduplicate, need_remove_expired_values); LOG_DEBUG(log, "Selected MergeAlgorithm: {}", ((merge_alg == MergeAlgorithm::Vertical) ? "Vertical" : "Horizontal")); @@ -803,7 +811,6 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor if (need_remove_expired_values) merged_stream = std::make_shared(merged_stream, data, metadata_snapshot, new_data_part, time_of_merge, force_ttl); - if (metadata_snapshot->hasSecondaryIndices()) { const auto & indices = metadata_snapshot->getSecondaryIndices(); @@ -863,6 +870,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor if (need_remove_expired_values && ttl_merges_blocker.isCancelled()) throw Exception("Cancelled merging parts with expired TTL", ErrorCodes::ABORTED); + bool need_sync = needSyncPart(sum_input_rows_upper_bound, sum_compressed_bytes_upper_bound, *data_settings); MergeTreeData::DataPart::Checksums checksums_gathered_columns; /// Gather ordinary columns @@ -942,7 +950,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor throw Exception("Cancelled merging parts", ErrorCodes::ABORTED); column_gathered_stream.readSuffix(); - auto changed_checksums = column_to.writeSuffixAndGetChecksums(new_data_part, checksums_gathered_columns); + auto changed_checksums = column_to.writeSuffixAndGetChecksums(new_data_part, checksums_gathered_columns, need_sync); checksums_gathered_columns.add(std::move(changed_checksums)); if (rows_written != column_elems_written) @@ -979,9 +987,12 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor } if (merge_alg != MergeAlgorithm::Vertical) - to.writeSuffixAndFinalizePart(new_data_part); + to.writeSuffixAndFinalizePart(new_data_part, need_sync); else - to.writeSuffixAndFinalizePart(new_data_part, &storage_columns, &checksums_gathered_columns); + to.writeSuffixAndFinalizePart(new_data_part, need_sync, &storage_columns, &checksums_gathered_columns); + + if (need_sync) + new_data_part->volume->getDisk()->sync(new_part_tmp_path); return new_data_part; } @@ -1081,7 +1092,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor /// Don't change granularity type while mutating subset of columns auto mrk_extension = source_part->index_granularity_info.is_adaptive ? 
getAdaptiveMrkExtension(new_data_part->getType()) : getNonAdaptiveMrkExtension(); - + bool need_sync = needSyncPart(source_part->rows_count, source_part->getBytesOnDisk(), *data_settings); bool need_remove_expired_values = false; if (in && shouldExecuteTTL(metadata_snapshot, in->getHeader().getNamesAndTypesList().getNames(), commands_for_part)) @@ -1099,7 +1110,8 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor time_of_mutation, compression_codec, merge_entry, - need_remove_expired_values); + need_remove_expired_values, + need_sync); /// no finalization required, because mutateAllPartColumns use /// MergedBlockOutputStream which finilaze all part fields itself @@ -1154,7 +1166,8 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor time_of_mutation, compression_codec, merge_entry, - need_remove_expired_values); + need_remove_expired_values, + need_sync); } for (const auto & [rename_from, rename_to] : files_to_rename) @@ -1174,6 +1187,9 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor finalizeMutatedPart(source_part, new_data_part, need_remove_expired_values); } + if (need_sync) + new_data_part->volume->getDisk()->sync(new_part_tmp_path); + return new_data_part; } @@ -1599,7 +1615,8 @@ void MergeTreeDataMergerMutator::mutateAllPartColumns( time_t time_of_mutation, const CompressionCodecPtr & compression_codec, MergeListEntry & merge_entry, - bool need_remove_expired_values) const + bool need_remove_expired_values, + bool need_sync) const { if (mutating_stream == nullptr) throw Exception("Cannot mutate part columns with uninitialized mutations stream. It's a bug", ErrorCodes::LOGICAL_ERROR); @@ -1637,7 +1654,7 @@ void MergeTreeDataMergerMutator::mutateAllPartColumns( new_data_part->minmax_idx = std::move(minmax_idx); mutating_stream->readSuffix(); - out.writeSuffixAndFinalizePart(new_data_part); + out.writeSuffixAndFinalizePart(new_data_part, need_sync); } void MergeTreeDataMergerMutator::mutateSomePartColumns( @@ -1650,7 +1667,8 @@ void MergeTreeDataMergerMutator::mutateSomePartColumns( time_t time_of_mutation, const CompressionCodecPtr & compression_codec, MergeListEntry & merge_entry, - bool need_remove_expired_values) const + bool need_remove_expired_values, + bool need_sync) const { if (mutating_stream == nullptr) throw Exception("Cannot mutate part columns with uninitialized mutations stream. 
It's a bug", ErrorCodes::LOGICAL_ERROR); @@ -1684,10 +1702,9 @@ void MergeTreeDataMergerMutator::mutateSomePartColumns( mutating_stream->readSuffix(); - auto changed_checksums = out.writeSuffixAndGetChecksums(new_data_part, new_data_part->checksums); + auto changed_checksums = out.writeSuffixAndGetChecksums(new_data_part, new_data_part->checksums, need_sync); new_data_part->checksums.add(std::move(changed_checksums)); - } void MergeTreeDataMergerMutator::finalizeMutatedPart( diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.h b/src/Storages/MergeTree/MergeTreeDataMergerMutator.h index 121cc770d51..23b8d7f681b 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.h +++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.h @@ -189,7 +189,8 @@ private: time_t time_of_mutation, const CompressionCodecPtr & codec, MergeListEntry & merge_entry, - bool need_remove_expired_values) const; + bool need_remove_expired_values, + bool need_sync) const; /// Mutate some columns of source part with mutation_stream void mutateSomePartColumns( @@ -202,7 +203,8 @@ private: time_t time_of_mutation, const CompressionCodecPtr & codec, MergeListEntry & merge_entry, - bool need_remove_expired_values) const; + bool need_remove_expired_values, + bool need_sync) const; /// Initialize and write to disk new part fields like checksums, columns, /// etc. diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp index f7a3ad75cf5..79800204a3b 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp @@ -141,7 +141,7 @@ void MergeTreeDataPartWriterCompact::writeColumnSingleGranule(const ColumnWithTy column.type->serializeBinaryBulkStateSuffix(serialize_settings, state); } -void MergeTreeDataPartWriterCompact::finishDataSerialization(IMergeTreeDataPart::Checksums & checksums) +void MergeTreeDataPartWriterCompact::finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool sync) { if (columns_buffer.size() != 0) writeBlock(header.cloneWithColumns(columns_buffer.releaseColumns())); @@ -158,6 +158,8 @@ void MergeTreeDataPartWriterCompact::finishDataSerialization(IMergeTreeDataPart: stream->finalize(); stream->addToChecksums(checksums); + if (sync) + stream->sync(); stream.reset(); } diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h index 8183c038c4c..dde7deafc58 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h @@ -20,7 +20,7 @@ public: void write(const Block & block, const IColumn::Permutation * permutation, const Block & primary_key_block, const Block & skip_indexes_block) override; - void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums) override; + void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool sync) override; protected: void fillIndexGranularity(size_t index_granularity_for_block, size_t rows_in_block) override; diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp index e71ea4d4b94..fcd0249b10c 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp @@ -264,7 +264,7 @@ void MergeTreeDataPartWriterWide::writeColumn( next_index_offset = current_row - total_rows; } -void 
MergeTreeDataPartWriterWide::finishDataSerialization(IMergeTreeDataPart::Checksums & checksums) +void MergeTreeDataPartWriterWide::finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool sync) { const auto & global_settings = storage.global_context.getSettingsRef(); IDataType::SerializeBinaryBulkSettings serialize_settings; @@ -295,6 +295,8 @@ void MergeTreeDataPartWriterWide::finishDataSerialization(IMergeTreeDataPart::Ch { stream.second->finalize(); stream.second->addToChecksums(checksums); + if (sync) + stream.second->sync(); } column_streams.clear(); diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h index f5a9d17f63c..4286065a3ca 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h @@ -23,7 +23,7 @@ public: void write(const Block & block, const IColumn::Permutation * permutation, const Block & primary_key_block, const Block & skip_indexes_block) override; - void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums) override; + void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool sync) override; IDataType::OutputStreamGetter createStreamGetter(const String & name, WrittenOffsetColumns & offset_columns); diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp index 099480aca2f..cf8860b7f04 100644 --- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp +++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp @@ -303,10 +303,15 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(BlockWithPa const auto & index_factory = MergeTreeIndexFactory::instance(); MergedBlockOutputStream out(new_data_part, metadata_snapshot, columns, index_factory.getMany(metadata_snapshot->getSecondaryIndices()), compression_codec); + bool sync_on_insert = data.getSettings()->sync_after_insert; out.writePrefix(); out.writeWithPermutation(block, perm_ptr); - out.writeSuffixAndFinalizePart(new_data_part); + out.writeSuffixAndFinalizePart(new_data_part, sync_on_insert); + + /// Sync part directory. + if (sync_on_insert) + new_data_part->volume->getDisk()->sync(full_path); ProfileEvents::increment(ProfileEvents::MergeTreeDataWriterRows, block.rows()); ProfileEvents::increment(ProfileEvents::MergeTreeDataWriterUncompressedBytes, block.bytes()); diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index f2d2a7cc3d4..da2c9ee49ee 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -43,6 +43,9 @@ struct MergeTreeSettings : public SettingsCollection M(SettingSeconds, old_parts_lifetime, 8 * 60, "How many seconds to keep obsolete parts.", 0) \ M(SettingSeconds, temporary_directories_lifetime, 86400, "How many seconds to keep tmp_-directories.", 0) \ M(SettingSeconds, lock_acquire_timeout_for_background_operations, DBMS_DEFAULT_LOCK_ACQUIRE_TIMEOUT_SEC, "For background operations like merges, mutations etc. How many seconds before failing to acquire table locks.", 0) \ + M(SettingUInt64, min_rows_to_sync_after_merge, 0, "Minimal number of rows to do fsync for part after merge (0 - disabled)", 0) \ + M(SettingUInt64, min_compressed_bytes_to_sync_after_merge, 0, "Minimal number of compressed bytes to do fsync for part after merge (0 - disabled)", 0) \ + M(SettingBool, sync_after_insert, false, "Do fsync for every inserted part. 
Significantly decreases performance of inserts, not recommended to use with wide parts.", 0) \ \ /** Inserts settings. */ \ M(SettingUInt64, parts_to_delay_insert, 150, "If table contains at least that many active parts in single partition, artificially slow down insert into table.", 0) \ diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.cpp b/src/Storages/MergeTree/MergedBlockOutputStream.cpp index e776a35f21f..5e15084aa7d 100644 --- a/src/Storages/MergeTree/MergedBlockOutputStream.cpp +++ b/src/Storages/MergeTree/MergedBlockOutputStream.cpp @@ -85,6 +85,7 @@ void MergedBlockOutputStream::writeSuffix() void MergedBlockOutputStream::writeSuffixAndFinalizePart( MergeTreeData::MutableDataPartPtr & new_part, + bool sync, const NamesAndTypesList * total_columns_list, MergeTreeData::DataPart::Checksums * additional_column_checksums) { @@ -95,9 +96,9 @@ void MergedBlockOutputStream::writeSuffixAndFinalizePart( checksums = std::move(*additional_column_checksums); /// Finish columns serialization. - writer->finishDataSerialization(checksums); - writer->finishPrimaryIndexSerialization(checksums); - writer->finishSkipIndicesSerialization(checksums); + writer->finishDataSerialization(checksums, sync); + writer->finishPrimaryIndexSerialization(checksums, sync); + writer->finishSkipIndicesSerialization(checksums, sync); NamesAndTypesList part_columns; if (!total_columns_list) diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.h b/src/Storages/MergeTree/MergedBlockOutputStream.h index 1a8bf9da822..002ef78a9af 100644 --- a/src/Storages/MergeTree/MergedBlockOutputStream.h +++ b/src/Storages/MergeTree/MergedBlockOutputStream.h @@ -46,6 +46,7 @@ public: /// Finilize writing part and fill inner structures void writeSuffixAndFinalizePart( MergeTreeData::MutableDataPartPtr & new_part, + bool sync = false, const NamesAndTypesList * total_columns_list = nullptr, MergeTreeData::DataPart::Checksums * additional_column_checksums = nullptr); diff --git a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp index 1faadd0d720..e767fb3f155 100644 --- a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp +++ b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp @@ -63,12 +63,15 @@ void MergedColumnOnlyOutputStream::writeSuffix() } MergeTreeData::DataPart::Checksums -MergedColumnOnlyOutputStream::writeSuffixAndGetChecksums(MergeTreeData::MutableDataPartPtr & new_part, MergeTreeData::DataPart::Checksums & all_checksums) +MergedColumnOnlyOutputStream::writeSuffixAndGetChecksums( + MergeTreeData::MutableDataPartPtr & new_part, + MergeTreeData::DataPart::Checksums & all_checksums, + bool sync) { /// Finish columns serialization. 
MergeTreeData::DataPart::Checksums checksums; - writer->finishDataSerialization(checksums); - writer->finishSkipIndicesSerialization(checksums); + writer->finishDataSerialization(checksums, sync); + writer->finishSkipIndicesSerialization(checksums, sync); auto columns = new_part->getColumns(); diff --git a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h index 902138ced9d..507a964ede0 100644 --- a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h +++ b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h @@ -27,7 +27,7 @@ public: void write(const Block & block) override; void writeSuffix() override; MergeTreeData::DataPart::Checksums - writeSuffixAndGetChecksums(MergeTreeData::MutableDataPartPtr & new_part, MergeTreeData::DataPart::Checksums & all_checksums); + writeSuffixAndGetChecksums(MergeTreeData::MutableDataPartPtr & new_part, MergeTreeData::DataPart::Checksums & all_checksums, bool sync = false); private: Block header; From b2aa565a37076230af2ceaa32ee21fa351d37931 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Sat, 27 Jun 2020 00:55:48 +0300 Subject: [PATCH 002/341] allow to turn on fsync on inserts, merges and fetches --- src/Common/FileSyncGuard.h | 41 +++++++++++++++++++ src/Disks/DiskLocal.cpp | 35 ++++++++++------ src/Disks/DiskLocal.h | 6 ++- src/Disks/DiskMemory.cpp | 20 ++++++--- src/Disks/DiskMemory.h | 6 ++- src/Disks/IDisk.h | 12 ++++-- src/Disks/S3/DiskS3.cpp | 21 +++++++--- src/Disks/S3/DiskS3.h | 6 ++- src/Storages/MergeTree/DataPartsExchange.cpp | 16 +++++++- src/Storages/MergeTree/DataPartsExchange.h | 1 + src/Storages/MergeTree/IMergeTreeDataPart.cpp | 5 +++ .../MergeTree/MergeTreeDataMergerMutator.cpp | 15 ++++--- .../MergeTree/MergeTreeDataWriter.cpp | 12 +++--- src/Storages/MergeTree/MergeTreeSettings.h | 2 + 14 files changed, 154 insertions(+), 44 deletions(-) create mode 100644 src/Common/FileSyncGuard.h diff --git a/src/Common/FileSyncGuard.h b/src/Common/FileSyncGuard.h new file mode 100644 index 00000000000..5ec9b1d0c98 --- /dev/null +++ b/src/Common/FileSyncGuard.h @@ -0,0 +1,41 @@ +#pragma once + +#include + +namespace DB +{ + +/// Helper class, that recieves file descriptor and does fsync for it in destructor. +/// It's used to keep descriptor open, while doing some operations with it, and do fsync at the end. +/// Guaranties of sequence 'close-reopen-fsync' may depend on kernel version. +/// Source: linux-fsdevel mailing-list https://marc.info/?l=linux-fsdevel&m=152535409207496 +class FileSyncGuard +{ +public: + /// NOTE: If you have already opened descriptor, it's preffered to use + /// this constructor instead of construnctor with path. + FileSyncGuard(const DiskPtr & disk_, int fd_) : disk(disk_), fd(fd_) {} + + FileSyncGuard(const DiskPtr & disk_, const String & path) + : disk(disk_), fd(disk_->open(path, O_RDONLY)) {} + + ~FileSyncGuard() + { + try + { + disk->sync(fd); + disk->close(fd); + } + catch (...) 
+ { + tryLogCurrentException(__PRETTY_FUNCTION__); + } + } + +private: + DiskPtr disk; + int fd = -1; +}; + +} + diff --git a/src/Disks/DiskLocal.cpp b/src/Disks/DiskLocal.cpp index c67bac7ffe2..f85b69baf5e 100644 --- a/src/Disks/DiskLocal.cpp +++ b/src/Disks/DiskLocal.cpp @@ -22,6 +22,7 @@ namespace ErrorCodes extern const int FILE_DOESNT_EXIST; extern const int CANNOT_OPEN_FILE; extern const int CANNOT_FSYNC; + extern const int CANNOT_CLOSE_FILE; } std::mutex DiskLocal::reservation_mutex; @@ -191,18 +192,6 @@ void DiskLocal::moveDirectory(const String & from_path, const String & to_path) Poco::File(disk_path + from_path).renameTo(disk_path + to_path); } -void DiskLocal::sync(const String & path) const -{ - String full_path = disk_path + path; - int fd = ::open(full_path.c_str(), O_RDONLY); - if (-1 == fd) - throwFromErrnoWithPath("Cannot open file " + full_path, full_path, - errno == ENOENT ? ErrorCodes::FILE_DOESNT_EXIST : ErrorCodes::CANNOT_OPEN_FILE); - - if (-1 == fsync(fd)) - throwFromErrnoWithPath("Cannot fsync " + full_path, full_path, ErrorCodes::CANNOT_FSYNC); -} - DiskDirectoryIteratorPtr DiskLocal::iterateDirectory(const String & path) { return std::make_unique(disk_path, path); @@ -299,6 +288,28 @@ void DiskLocal::copy(const String & from_path, const std::shared_ptr & to IDisk::copy(from_path, to_disk, to_path); /// Copy files through buffers. } +int DiskLocal::open(const String & path, mode_t mode) const +{ + String full_path = disk_path + path; + int fd = ::open(full_path.c_str(), mode); + if (-1 == fd) + throwFromErrnoWithPath("Cannot open file " + full_path, full_path, + errno == ENOENT ? ErrorCodes::FILE_DOESNT_EXIST : ErrorCodes::CANNOT_OPEN_FILE); + return fd; +} + +void DiskLocal::close(int fd) const +{ + if (-1 == ::close(fd)) + throw Exception("Cannot close file", ErrorCodes::CANNOT_CLOSE_FILE); +} + +void DiskLocal::sync(int fd) const +{ + if (-1 == ::fsync(fd)) + throw Exception("Cannot fsync", ErrorCodes::CANNOT_FSYNC); +} + DiskPtr DiskLocalReservation::getDisk(size_t i) const { if (i != 0) diff --git a/src/Disks/DiskLocal.h b/src/Disks/DiskLocal.h index 743ba2ceb10..d70ac06c18b 100644 --- a/src/Disks/DiskLocal.h +++ b/src/Disks/DiskLocal.h @@ -59,8 +59,6 @@ public: void moveDirectory(const String & from_path, const String & to_path) override; - void sync(const String & path) const override; - DiskDirectoryIteratorPtr iterateDirectory(const String & path) override; void createFile(const String & path) override; @@ -101,6 +99,10 @@ public: void createHardLink(const String & src_path, const String & dst_path) override; + int open(const String & path, mode_t mode) const override; + void close(int fd) const override; + void sync(int fd) const override; + private: bool tryReserve(UInt64 bytes); diff --git a/src/Disks/DiskMemory.cpp b/src/Disks/DiskMemory.cpp index 5b3350e40f7..a7f1df04e1f 100644 --- a/src/Disks/DiskMemory.cpp +++ b/src/Disks/DiskMemory.cpp @@ -261,11 +261,6 @@ void DiskMemory::moveDirectory(const String & /*from_path*/, const String & /*to throw Exception("Method moveDirectory is not implemented for memory disks", ErrorCodes::NOT_IMPLEMENTED); } -void DiskMemory::sync(const String & /*path*/) const -{ - throw Exception("Method sync is not implemented for memory disks", ErrorCodes::NOT_IMPLEMENTED); -} - DiskDirectoryIteratorPtr DiskMemory::iterateDirectory(const String & path) { std::lock_guard lock(mutex); @@ -413,6 +408,21 @@ void DiskMemory::setReadOnly(const String &) throw Exception("Method setReadOnly is not implemented for memory disks", 
ErrorCodes::NOT_IMPLEMENTED); } +int DiskMemory::open(const String & /*path*/, mode_t /*mode*/) const +{ + throw Exception("Method open is not implemented for memory disks", ErrorCodes::NOT_IMPLEMENTED); +} + +void DiskMemory::close(int /*fd*/) const +{ + throw Exception("Method close is not implemented for memory disks", ErrorCodes::NOT_IMPLEMENTED); +} + +void DiskMemory::sync(int /*fd*/) const +{ + throw Exception("Method sync is not implemented for memory disks", ErrorCodes::NOT_IMPLEMENTED); +} + using DiskMemoryPtr = std::shared_ptr; diff --git a/src/Disks/DiskMemory.h b/src/Disks/DiskMemory.h index 8a3ddf05aa7..7f111fe5e7d 100644 --- a/src/Disks/DiskMemory.h +++ b/src/Disks/DiskMemory.h @@ -52,8 +52,6 @@ public: void moveDirectory(const String & from_path, const String & to_path) override; - void sync(const String & path) const override; - DiskDirectoryIteratorPtr iterateDirectory(const String & path) override; void createFile(const String & path) override; @@ -92,6 +90,10 @@ public: void createHardLink(const String & src_path, const String & dst_path) override; + int open(const String & path, mode_t mode) const override; + void close(int fd) const override; + void sync(int fd) const override; + private: void createDirectoriesImpl(const String & path); void replaceFileImpl(const String & from_path, const String & to_path); diff --git a/src/Disks/IDisk.h b/src/Disks/IDisk.h index 8de77a560d1..bc5c9381643 100644 --- a/src/Disks/IDisk.h +++ b/src/Disks/IDisk.h @@ -105,9 +105,6 @@ public: /// Move directory from `from_path` to `to_path`. virtual void moveDirectory(const String & from_path, const String & to_path) = 0; - /// Do fsync on directory. - virtual void sync(const String & path) const = 0; - /// Return iterator to the contents of the specified directory. virtual DiskDirectoryIteratorPtr iterateDirectory(const String & path) = 0; @@ -174,6 +171,15 @@ public: /// Create hardlink from `src_path` to `dst_path`. 
virtual void createHardLink(const String & src_path, const String & dst_path) = 0; + + /// Wrapper for POSIX open + virtual int open(const String & path, mode_t mode) const = 0; + + /// Wrapper for POSIX close + virtual void close(int fd) const = 0; + + /// Wrapper for POSIX fsync + virtual void sync(int fd) const = 0; }; using DiskPtr = std::shared_ptr; diff --git a/src/Disks/S3/DiskS3.cpp b/src/Disks/S3/DiskS3.cpp index 292f6567df4..3e0fb05ed6f 100644 --- a/src/Disks/S3/DiskS3.cpp +++ b/src/Disks/S3/DiskS3.cpp @@ -29,6 +29,7 @@ namespace ErrorCodes extern const int CANNOT_SEEK_THROUGH_FILE; extern const int UNKNOWN_FORMAT; extern const int INCORRECT_DISK_INDEX; + extern const int NOT_IMPLEMENTED; } namespace @@ -466,11 +467,6 @@ void DiskS3::clearDirectory(const String & path) remove(it->path()); } -void DiskS3::sync(const String & /*path*/) const -{ - throw Exception("Method sync is not implemented for S3 disks", ErrorCodes::NOT_IMPLEMENTED); -} - void DiskS3::moveFile(const String & from_path, const String & to_path) { if (exists(to_path)) @@ -669,6 +665,21 @@ void DiskS3::setReadOnly(const String & path) Poco::File(metadata_path + path).setReadOnly(true); } +int DiskS3::open(const String & /*path*/, mode_t /*mode*/) const +{ + throw Exception("Method open is not implemented for S3 disks", ErrorCodes::NOT_IMPLEMENTED); +} + +void DiskS3::close(int /*fd*/) const +{ + throw Exception("Method close is not implemented for S3 disks", ErrorCodes::NOT_IMPLEMENTED); +} + +void DiskS3::sync(int /*fd*/) const +{ + throw Exception("Method sync is not implemented for S3 disks", ErrorCodes::NOT_IMPLEMENTED); +} + DiskS3Reservation::~DiskS3Reservation() { try diff --git a/src/Disks/S3/DiskS3.h b/src/Disks/S3/DiskS3.h index 09132367ae8..cbf161da561 100644 --- a/src/Disks/S3/DiskS3.h +++ b/src/Disks/S3/DiskS3.h @@ -58,8 +58,6 @@ public: void moveDirectory(const String & from_path, const String & to_path) override { moveFile(from_path, to_path); } - void sync(const String & path) const override; - DiskDirectoryIteratorPtr iterateDirectory(const String & path) override; void moveFile(const String & from_path, const String & to_path) override; @@ -98,6 +96,10 @@ public: void setReadOnly(const String & path) override; + int open(const String & path, mode_t mode) const override; + void close(int fd) const override; + void sync(int fd) const override; + private: bool tryReserve(UInt64 bytes); diff --git a/src/Storages/MergeTree/DataPartsExchange.cpp b/src/Storages/MergeTree/DataPartsExchange.cpp index 6796e630ff2..e7bb8206cd9 100644 --- a/src/Storages/MergeTree/DataPartsExchange.cpp +++ b/src/Storages/MergeTree/DataPartsExchange.cpp @@ -2,6 +2,7 @@ #include #include #include +#include #include #include #include @@ -224,9 +225,9 @@ MergeTreeData::MutableDataPartPtr Fetcher::fetchPart( int server_protocol_version = parse(in.getResponseCookie("server_protocol_version", "0")); ReservationPtr reservation; + size_t sum_files_size = 0; if (server_protocol_version >= REPLICATION_PROTOCOL_VERSION_WITH_PARTS_SIZE) { - size_t sum_files_size; readBinary(sum_files_size, in); if (server_protocol_version >= REPLICATION_PROTOCOL_VERSION_WITH_PARTS_SIZE_AND_TTL_INFOS) { @@ -247,7 +248,10 @@ MergeTreeData::MutableDataPartPtr Fetcher::fetchPart( reservation = data.makeEmptyReservationOnLargestDisk(); } - return downloadPart(part_name, replica_path, to_detached, tmp_prefix_, std::move(reservation), in); + bool sync = (data_settings->min_compressed_bytes_to_sync_after_fetch + && sum_files_size >= 
data_settings->min_compressed_bytes_to_sync_after_fetch); + + return downloadPart(part_name, replica_path, to_detached, tmp_prefix_, sync, std::move(reservation), in); } MergeTreeData::MutableDataPartPtr Fetcher::downloadPart( @@ -255,6 +259,7 @@ MergeTreeData::MutableDataPartPtr Fetcher::downloadPart( const String & replica_path, bool to_detached, const String & tmp_prefix_, + bool sync, const ReservationPtr reservation, PooledReadWriteBufferFromHTTP & in) { @@ -276,6 +281,10 @@ MergeTreeData::MutableDataPartPtr Fetcher::downloadPart( disk->createDirectories(part_download_path); + std::optional sync_guard; + if (data.getSettings()->sync_part_directory) + sync_guard.emplace(disk, part_download_path); + MergeTreeData::DataPart::Checksums checksums; for (size_t i = 0; i < files; ++i) { @@ -316,6 +325,9 @@ MergeTreeData::MutableDataPartPtr Fetcher::downloadPart( if (file_name != "checksums.txt" && file_name != "columns.txt") checksums.addFile(file_name, file_size, expected_hash); + + if (sync) + hashing_out.sync(); } assertEOF(in); diff --git a/src/Storages/MergeTree/DataPartsExchange.h b/src/Storages/MergeTree/DataPartsExchange.h index c1aff6bdba5..e983d6deecf 100644 --- a/src/Storages/MergeTree/DataPartsExchange.h +++ b/src/Storages/MergeTree/DataPartsExchange.h @@ -71,6 +71,7 @@ private: const String & replica_path, bool to_detached, const String & tmp_prefix_, + bool sync, const ReservationPtr reservation, PooledReadWriteBufferFromHTTP & in); diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 61dfeed6b7c..ab9bb7879aa 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -10,6 +10,7 @@ #include #include #include +#include #include #include @@ -664,6 +665,10 @@ void IMergeTreeDataPart::renameTo(const String & new_relative_path, bool remove_ String from = getFullRelativePath(); String to = storage.relative_data_path + new_relative_path + "/"; + std::optional sync_guard; + if (storage.getSettings()->sync_part_directory) + sync_guard.emplace(volume->getDisk(), to); + if (!volume->getDisk()->exists(from)) throw Exception("Part directory " + fullPath(volume->getDisk(), from) + " doesn't exist. Most likely it is logical error.", ErrorCodes::FILE_DOESNT_EXIST); diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp index ccd7f234925..9c8c4e3c1d5 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp +++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp @@ -30,6 +30,7 @@ #include #include #include +#include #include #include #include @@ -695,6 +696,10 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor gathering_column_names.clear(); } + std::optional sync_guard; + if (data.getSettings()->sync_part_directory) + sync_guard.emplace(disk, new_part_tmp_path); + /** Read from all parts, merge and write into a new one. * In passing, we calculate expression for sorting. 
*/ @@ -991,9 +996,6 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor else to.writeSuffixAndFinalizePart(new_data_part, need_sync, &storage_columns, &checksums_gathered_columns); - if (need_sync) - new_data_part->volume->getDisk()->sync(new_part_tmp_path); - return new_data_part; } @@ -1089,6 +1091,10 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor disk->createDirectories(new_part_tmp_path); + std::optional sync_guard; + if (data.getSettings()->sync_part_directory) + sync_guard.emplace(disk, new_part_tmp_path); + /// Don't change granularity type while mutating subset of columns auto mrk_extension = source_part->index_granularity_info.is_adaptive ? getAdaptiveMrkExtension(new_data_part->getType()) : getNonAdaptiveMrkExtension(); @@ -1187,9 +1193,6 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor finalizeMutatedPart(source_part, new_data_part, need_remove_expired_values); } - if (need_sync) - new_data_part->volume->getDisk()->sync(new_part_tmp_path); - return new_data_part; } diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp index cf8860b7f04..01f0b086cea 100644 --- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp +++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp @@ -12,6 +12,7 @@ #include #include #include +#include namespace ProfileEvents @@ -259,7 +260,12 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(BlockWithPa new_data_part->volume->getDisk()->removeRecursive(full_path); } - new_data_part->volume->getDisk()->createDirectories(full_path); + const auto disk = new_data_part->volume->getDisk(); + disk->createDirectories(full_path); + + std::optional sync_guard; + if (data.getSettings()->sync_part_directory) + sync_guard.emplace(disk, full_path); /// If we need to calculate some columns to sort. if (metadata_snapshot->hasSortingKey() || metadata_snapshot->hasSecondaryIndices()) @@ -309,10 +315,6 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(BlockWithPa out.writeWithPermutation(block, perm_ptr); out.writeSuffixAndFinalizePart(new_data_part, sync_on_insert); - /// Sync part directory. - if (sync_on_insert) - new_data_part->volume->getDisk()->sync(full_path); - ProfileEvents::increment(ProfileEvents::MergeTreeDataWriterRows, block.rows()); ProfileEvents::increment(ProfileEvents::MergeTreeDataWriterUncompressedBytes, block.bytes()); ProfileEvents::increment(ProfileEvents::MergeTreeDataWriterCompressedBytes, new_data_part->getBytesOnDisk()); diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index da2c9ee49ee..c559ce2804e 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -45,7 +45,9 @@ struct MergeTreeSettings : public SettingsCollection M(SettingSeconds, lock_acquire_timeout_for_background_operations, DBMS_DEFAULT_LOCK_ACQUIRE_TIMEOUT_SEC, "For background operations like merges, mutations etc. 
How many seconds before failing to acquire table locks.", 0) \ M(SettingUInt64, min_rows_to_sync_after_merge, 0, "Minimal number of rows to do fsync for part after merge (0 - disabled)", 0) \ M(SettingUInt64, min_compressed_bytes_to_sync_after_merge, 0, "Minimal number of compressed bytes to do fsync for part after merge (0 - disabled)", 0) \ + M(SettingUInt64, min_compressed_bytes_to_sync_after_fetch, 0, "Minimal number of compressed bytes to do fsync for part after fetch (0 - disabled)", 0) \ M(SettingBool, sync_after_insert, false, "Do fsync for every inserted part. Significantly decreases performance of inserts, not recommended to use with wide parts.", 0) \ + M(SettingBool, sync_part_directory, false, "Do fsync for part directory after all part operations (writes, renames, etc.).", 0) \ \ /** Inserts settings. */ \ M(SettingUInt64, parts_to_delay_insert, 150, "If table contains at least that many active parts in single partition, artificially slow down insert into table.", 0) \ From ca346ea13cd0ad0f02a29d59302584c826b52298 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Fri, 3 Jul 2020 02:41:37 +0300 Subject: [PATCH 003/341] rename fsync-related settings --- src/Storages/MergeTree/DataPartsExchange.cpp | 6 +++--- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 2 +- src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp | 8 ++++---- src/Storages/MergeTree/MergeTreeDataWriter.cpp | 4 ++-- src/Storages/MergeTree/MergeTreeSettings.h | 10 +++++----- 5 files changed, 15 insertions(+), 15 deletions(-) diff --git a/src/Storages/MergeTree/DataPartsExchange.cpp b/src/Storages/MergeTree/DataPartsExchange.cpp index e7bb8206cd9..72b478cf587 100644 --- a/src/Storages/MergeTree/DataPartsExchange.cpp +++ b/src/Storages/MergeTree/DataPartsExchange.cpp @@ -248,8 +248,8 @@ MergeTreeData::MutableDataPartPtr Fetcher::fetchPart( reservation = data.makeEmptyReservationOnLargestDisk(); } - bool sync = (data_settings->min_compressed_bytes_to_sync_after_fetch - && sum_files_size >= data_settings->min_compressed_bytes_to_sync_after_fetch); + bool sync = (data_settings->min_compressed_bytes_to_fsync_after_fetch + && sum_files_size >= data_settings->min_compressed_bytes_to_fsync_after_fetch); return downloadPart(part_name, replica_path, to_detached, tmp_prefix_, sync, std::move(reservation), in); } @@ -282,7 +282,7 @@ MergeTreeData::MutableDataPartPtr Fetcher::downloadPart( disk->createDirectories(part_download_path); std::optional sync_guard; - if (data.getSettings()->sync_part_directory) + if (data.getSettings()->fsync_part_directory) sync_guard.emplace(disk, part_download_path); MergeTreeData::DataPart::Checksums checksums; diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index ab9bb7879aa..3d8cb6b7fc5 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -666,7 +666,7 @@ void IMergeTreeDataPart::renameTo(const String & new_relative_path, bool remove_ String to = storage.relative_data_path + new_relative_path + "/"; std::optional sync_guard; - if (storage.getSettings()->sync_part_directory) + if (storage.getSettings()->fsync_part_directory) sync_guard.emplace(volume->getDisk(), to); if (!volume->getDisk()->exists(from)) diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp index 9c8c4e3c1d5..c39d1981031 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp +++ 
b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp @@ -579,8 +579,8 @@ public: static bool needSyncPart(const size_t input_rows, size_t input_bytes, const MergeTreeSettings & settings) { - return ((settings.min_rows_to_sync_after_merge && input_rows >= settings.min_rows_to_sync_after_merge) - || (settings.min_compressed_bytes_to_sync_after_merge && input_bytes >= settings.min_compressed_bytes_to_sync_after_merge)); + return ((settings.min_rows_to_fsync_after_merge && input_rows >= settings.min_rows_to_fsync_after_merge) + || (settings.min_compressed_bytes_to_fsync_after_merge && input_bytes >= settings.min_compressed_bytes_to_fsync_after_merge)); } @@ -697,7 +697,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor } std::optional sync_guard; - if (data.getSettings()->sync_part_directory) + if (data.getSettings()->fsync_part_directory) sync_guard.emplace(disk, new_part_tmp_path); /** Read from all parts, merge and write into a new one. @@ -1092,7 +1092,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor disk->createDirectories(new_part_tmp_path); std::optional sync_guard; - if (data.getSettings()->sync_part_directory) + if (data.getSettings()->fsync_part_directory) sync_guard.emplace(disk, new_part_tmp_path); /// Don't change granularity type while mutating subset of columns diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp index 01f0b086cea..23210fc604e 100644 --- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp +++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp @@ -264,7 +264,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(BlockWithPa disk->createDirectories(full_path); std::optional sync_guard; - if (data.getSettings()->sync_part_directory) + if (data.getSettings()->fsync_part_directory) sync_guard.emplace(disk, full_path); /// If we need to calculate some columns to sort. @@ -309,7 +309,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(BlockWithPa const auto & index_factory = MergeTreeIndexFactory::instance(); MergedBlockOutputStream out(new_data_part, metadata_snapshot, columns, index_factory.getMany(metadata_snapshot->getSecondaryIndices()), compression_codec); - bool sync_on_insert = data.getSettings()->sync_after_insert; + bool sync_on_insert = data.getSettings()->fsync_after_insert; out.writePrefix(); out.writeWithPermutation(block, perm_ptr); diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index c559ce2804e..eeee0c4b1e1 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -43,11 +43,11 @@ struct MergeTreeSettings : public SettingsCollection M(SettingSeconds, old_parts_lifetime, 8 * 60, "How many seconds to keep obsolete parts.", 0) \ M(SettingSeconds, temporary_directories_lifetime, 86400, "How many seconds to keep tmp_-directories.", 0) \ M(SettingSeconds, lock_acquire_timeout_for_background_operations, DBMS_DEFAULT_LOCK_ACQUIRE_TIMEOUT_SEC, "For background operations like merges, mutations etc. 
How many seconds before failing to acquire table locks.", 0) \ - M(SettingUInt64, min_rows_to_sync_after_merge, 0, "Minimal number of rows to do fsync for part after merge (0 - disabled)", 0) \ - M(SettingUInt64, min_compressed_bytes_to_sync_after_merge, 0, "Minimal number of compressed bytes to do fsync for part after merge (0 - disabled)", 0) \ - M(SettingUInt64, min_compressed_bytes_to_sync_after_fetch, 0, "Minimal number of compressed bytes to do fsync for part after fetch (0 - disabled)", 0) \ - M(SettingBool, sync_after_insert, false, "Do fsync for every inserted part. Significantly decreases performance of inserts, not recommended to use with wide parts.", 0) \ - M(SettingBool, sync_part_directory, false, "Do fsync for part directory after all part operations (writes, renames, etc.).", 0) \ + M(SettingUInt64, min_rows_to_fsync_after_merge, 0, "Minimal number of rows to do fsync for part after merge (0 - disabled)", 0) \ + M(SettingUInt64, min_compressed_bytes_to_fsync_after_merge, 0, "Minimal number of compressed bytes to do fsync for part after merge (0 - disabled)", 0) \ + M(SettingUInt64, min_compressed_bytes_to_fsync_after_fetch, 0, "Minimal number of compressed bytes to do fsync for part after fetch (0 - disabled)", 0) \ + M(SettingBool, fsync_after_insert, false, "Do fsync for every inserted part. Significantly decreases performance of inserts, not recommended to use with wide parts.", 0) \ + M(SettingBool, fsync_part_directory, false, "Do fsync for part directory after all part operations (writes, renames, etc.).", 0) \ \ /** Inserts settings. */ \ M(SettingUInt64, parts_to_delay_insert, 150, "If table contains at least that many active parts in single partition, artificially slow down insert into table.", 0) \ From 230938d3a3082fbf241c9d873571231a69a5f450 Mon Sep 17 00:00:00 2001 From: Amos Bird Date: Sat, 11 Jul 2020 15:12:42 +0800 Subject: [PATCH 004/341] Refactor joinGet and implement multi-key lookup. 
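This change generalizes joinGet from a single-key lookup into a StorageJoin table to a
composite-key lookup: every argument after the table name and attribute name is now treated
as one key column, and the key types are checked against the right-table keys. A rough usage
sketch (table and column names below are illustrative only, not taken from this patch):

    -- Join table with a two-column key
    CREATE TABLE kv_pairs (k1 UInt32, k2 String, v Float64)
    ENGINE = Join(ANY, LEFT, k1, k2);

    INSERT INTO kv_pairs VALUES (1, 'a', 0.1), (2, 'b', 0.2);

    -- one argument per key column after the table and attribute names;
    -- key types must match the Join table exactly, hence the explicit toUInt32
    SELECT joinGet('kv_pairs', 'v', toUInt32(1), 'a');  -- 0.1
    SELECT joinGet('kv_pairs', 'v', toUInt32(3), 'c');  -- 0 (type default for a missing key)

The new test file 01400_join_get_with_multi_keys.sql listed in the diffstat below exercises the
multi-key path.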
--- src/Functions/FunctionJoinGet.cpp | 83 +++++++++---------- src/Functions/FunctionJoinGet.h | 11 +-- src/Interpreters/HashJoin.cpp | 69 ++++++++------- src/Interpreters/HashJoin.h | 10 +-- src/Interpreters/misc.h | 2 +- .../0_stateless/01080_join_get_null.reference | 2 +- .../0_stateless/01080_join_get_null.sql | 12 +-- .../01400_join_get_with_multi_keys.reference | 1 + .../01400_join_get_with_multi_keys.sql | 9 ++ 9 files changed, 104 insertions(+), 95 deletions(-) create mode 100644 tests/queries/0_stateless/01400_join_get_with_multi_keys.reference create mode 100644 tests/queries/0_stateless/01400_join_get_with_multi_keys.sql diff --git a/src/Functions/FunctionJoinGet.cpp b/src/Functions/FunctionJoinGet.cpp index a33b70684a5..1badc689c6a 100644 --- a/src/Functions/FunctionJoinGet.cpp +++ b/src/Functions/FunctionJoinGet.cpp @@ -1,10 +1,10 @@ #include +#include #include #include #include #include -#include #include @@ -16,19 +16,35 @@ namespace ErrorCodes extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; } +template +void ExecutableFunctionJoinGet::execute(Block & block, const ColumnNumbers & arguments, size_t result, size_t) +{ + Block keys; + for (size_t i = 2; i < arguments.size(); ++i) + { + auto key = block.getByPosition(arguments[i]); + keys.insert(std::move(key)); + } + block.getByPosition(result) = join->joinGet(keys, result_block); +} + +template +ExecutableFunctionImplPtr FunctionJoinGet::prepare(const Block &, const ColumnNumbers &, size_t) const +{ + return std::make_unique>(join, Block{{return_type->createColumn(), return_type, attr_name}}); +} + static auto getJoin(const ColumnsWithTypeAndName & arguments, const Context & context) { - if (arguments.size() != 3) - throw Exception{"Function joinGet takes 3 arguments", ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH}; - String join_name; if (const auto * name_col = checkAndGetColumnConst(arguments[0].column.get())) { join_name = name_col->getValue(); } else - throw Exception{"Illegal type " + arguments[0].type->getName() + " of first argument of function joinGet, expected a const string.", - ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT}; + throw Exception( + "Illegal type " + arguments[0].type->getName() + " of first argument of function joinGet, expected a const string.", + ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT); size_t dot = join_name.find('.'); String database_name; @@ -43,10 +59,12 @@ static auto getJoin(const ColumnsWithTypeAndName & arguments, const Context & co ++dot; } String table_name = join_name.substr(dot); + if (table_name.empty()) + throw Exception("joinGet does not allow empty table name", ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT); auto table = DatabaseCatalog::instance().getTable({database_name, table_name}, context); auto storage_join = std::dynamic_pointer_cast(table); if (!storage_join) - throw Exception{"Table " + join_name + " should have engine StorageJoin", ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT}; + throw Exception("Table " + join_name + " should have engine StorageJoin", ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT); String attr_name; if (const auto * name_col = checkAndGetColumnConst(arguments[1].column.get())) @@ -54,57 +72,30 @@ static auto getJoin(const ColumnsWithTypeAndName & arguments, const Context & co attr_name = name_col->getValue(); } else - throw Exception{"Illegal type " + arguments[1].type->getName() - + " of second argument of function joinGet, expected a const string.", - ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT}; + throw Exception( + "Illegal type " + arguments[1].type->getName() + " of second argument of 
function joinGet, expected a const string.", + ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT); return std::make_pair(storage_join, attr_name); } template FunctionBaseImplPtr JoinGetOverloadResolver::build(const ColumnsWithTypeAndName & arguments, const DataTypePtr &) const { + if (arguments.size() < 3) + throw Exception( + "Number of arguments for function " + getName() + " doesn't match: passed " + toString(arguments.size()) + + ", should be greater or equal to 3", + ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH); auto [storage_join, attr_name] = getJoin(arguments, context); auto join = storage_join->getJoin(); - DataTypes data_types(arguments.size()); - + DataTypes data_types(arguments.size() - 2); + for (size_t i = 2; i < arguments.size(); ++i) + data_types[i - 2] = arguments[i].type; + auto return_type = join->joinGetCheckAndGetReturnType(data_types, attr_name, or_null); auto table_lock = storage_join->lockForShare(context.getInitialQueryId(), context.getSettingsRef().lock_acquire_timeout); - for (size_t i = 0; i < arguments.size(); ++i) - data_types[i] = arguments[i].type; - - auto return_type = join->joinGetReturnType(attr_name, or_null); return std::make_unique>(table_lock, storage_join, join, attr_name, data_types, return_type); } -template -DataTypePtr JoinGetOverloadResolver::getReturnType(const ColumnsWithTypeAndName & arguments) const -{ - auto [storage_join, attr_name] = getJoin(arguments, context); - auto join = storage_join->getJoin(); - return join->joinGetReturnType(attr_name, or_null); -} - - -template -void ExecutableFunctionJoinGet::execute(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) -{ - auto ctn = block.getByPosition(arguments[2]); - if (isColumnConst(*ctn.column)) - ctn.column = ctn.column->cloneResized(1); - ctn.name = ""; // make sure the key name never collide with the join columns - Block key_block = {ctn}; - join->joinGet(key_block, attr_name, or_null); - auto & result_ctn = key_block.getByPosition(1); - if (isColumnConst(*ctn.column)) - result_ctn.column = ColumnConst::create(result_ctn.column, input_rows_count); - block.getByPosition(result) = result_ctn; -} - -template -ExecutableFunctionImplPtr FunctionJoinGet::prepare(const Block &, const ColumnNumbers &, size_t) const -{ - return std::make_unique>(join, attr_name); -} - void registerFunctionJoinGet(FunctionFactory & factory) { // joinGet diff --git a/src/Functions/FunctionJoinGet.h b/src/Functions/FunctionJoinGet.h index a82da589960..6b3b1202f60 100644 --- a/src/Functions/FunctionJoinGet.h +++ b/src/Functions/FunctionJoinGet.h @@ -13,14 +13,14 @@ template class ExecutableFunctionJoinGet final : public IExecutableFunctionImpl { public: - ExecutableFunctionJoinGet(HashJoinPtr join_, String attr_name_) - : join(std::move(join_)), attr_name(std::move(attr_name_)) {} + ExecutableFunctionJoinGet(HashJoinPtr join_, const Block & result_block_) + : join(std::move(join_)), result_block(result_block_) {} static constexpr auto name = or_null ? 
"joinGetOrNull" : "joinGet"; bool useDefaultImplementationForNulls() const override { return false; } - bool useDefaultImplementationForConstants() const override { return true; } bool useDefaultImplementationForLowCardinalityColumns() const override { return true; } + bool useDefaultImplementationForConstants() const override { return true; } void execute(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) override; @@ -28,7 +28,7 @@ public: private: HashJoinPtr join; - const String attr_name; + Block result_block; }; template @@ -77,13 +77,14 @@ public: String getName() const override { return name; } FunctionBaseImplPtr build(const ColumnsWithTypeAndName & arguments, const DataTypePtr &) const override; - DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments) const override; + DataTypePtr getReturnType(const ColumnsWithTypeAndName &) const override { return {}; } // Not used bool useDefaultImplementationForNulls() const override { return false; } bool useDefaultImplementationForLowCardinalityColumns() const override { return true; } bool isVariadic() const override { return true; } size_t getNumberOfArguments() const override { return 0; } + ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {0, 1}; } private: const Context & context; diff --git a/src/Interpreters/HashJoin.cpp b/src/Interpreters/HashJoin.cpp index 27294a57675..ffc806b9e88 100644 --- a/src/Interpreters/HashJoin.cpp +++ b/src/Interpreters/HashJoin.cpp @@ -42,6 +42,7 @@ namespace ErrorCodes extern const int SYNTAX_ERROR; extern const int SET_SIZE_LIMIT_EXCEEDED; extern const int TYPE_MISMATCH; + extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; } namespace @@ -1109,27 +1110,34 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed) block = block.cloneWithColumns(std::move(dst_columns)); } -static void checkTypeOfKey(const Block & block_left, const Block & block_right) -{ - const auto & [c1, left_type_origin, left_name] = block_left.safeGetByPosition(0); - const auto & [c2, right_type_origin, right_name] = block_right.safeGetByPosition(0); - auto left_type = removeNullable(left_type_origin); - auto right_type = removeNullable(right_type_origin); - if (!left_type->equals(*right_type)) - throw Exception("Type mismatch of columns to joinGet by: " - + left_name + " " + left_type->getName() + " at left, " - + right_name + " " + right_type->getName() + " at right", - ErrorCodes::TYPE_MISMATCH); -} - - -DataTypePtr HashJoin::joinGetReturnType(const String & column_name, bool or_null) const +DataTypePtr HashJoin::joinGetCheckAndGetReturnType(const DataTypes & data_types, const String & column_name, bool or_null) const { std::shared_lock lock(data->rwlock); + size_t num_keys = data_types.size(); + if (right_table_keys.columns() != num_keys) + throw Exception( + "Number of arguments for function joinGet" + toString(or_null ? 
"OrNull" : "") + + " doesn't match: passed, should be equal to " + toString(num_keys), + ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH); + + for (size_t i = 0; i < num_keys; ++i) + { + const auto & left_type_origin = data_types[i]; + const auto & [c2, right_type_origin, right_name] = right_table_keys.safeGetByPosition(i); + auto left_type = removeNullable(left_type_origin); + auto right_type = removeNullable(right_type_origin); + if (!left_type->equals(*right_type)) + throw Exception( + "Type mismatch in joinGet key " + toString(i) + ": found type " + left_type->getName() + ", while the needed type is " + + right_type->getName(), + ErrorCodes::TYPE_MISMATCH); + } + if (!sample_block_with_columns_to_add.has(column_name)) throw Exception("StorageJoin doesn't contain column " + column_name, ErrorCodes::NO_SUCH_COLUMN_IN_TABLE); + auto elem = sample_block_with_columns_to_add.getByName(column_name); if (or_null) elem.type = makeNullable(elem.type); @@ -1138,34 +1146,33 @@ DataTypePtr HashJoin::joinGetReturnType(const String & column_name, bool or_null template -void HashJoin::joinGetImpl(Block & block, const Block & block_with_columns_to_add, const Maps & maps_) const +ColumnWithTypeAndName HashJoin::joinGetImpl(const Block & block, const Block & block_with_columns_to_add, const Maps & maps_) const { - joinBlockImpl( - block, {block.getByPosition(0).name}, block_with_columns_to_add, maps_); + // Assemble the key block with correct names. + Block keys; + for (size_t i = 0; i < block.columns(); ++i) + { + auto key = block.getByPosition(i); + key.name = key_names_right[i]; + keys.insert(std::move(key)); + } + + joinBlockImpl( + keys, key_names_right, block_with_columns_to_add, maps_); + return keys.getByPosition(keys.columns() - 1); } -// TODO: support composite key // TODO: return multiple columns as named tuple // TODO: return array of values when strictness == ASTTableJoin::Strictness::All -void HashJoin::joinGet(Block & block, const String & column_name, bool or_null) const +ColumnWithTypeAndName HashJoin::joinGet(const Block & block, const Block & block_with_columns_to_add) const { std::shared_lock lock(data->rwlock); - if (key_names_right.size() != 1) - throw Exception("joinGet only supports StorageJoin containing exactly one key", ErrorCodes::UNSUPPORTED_JOIN_KEYS); - - checkTypeOfKey(block, right_table_keys); - - auto elem = sample_block_with_columns_to_add.getByName(column_name); - if (or_null) - elem.type = makeNullable(elem.type); - elem.column = elem.type->createColumn(); - if ((strictness == ASTTableJoin::Strictness::Any || strictness == ASTTableJoin::Strictness::RightAny) && kind == ASTTableJoin::Kind::Left) { - joinGetImpl(block, {elem}, std::get(data->maps)); + return joinGetImpl(block, block_with_columns_to_add, std::get(data->maps)); } else throw Exception("joinGet only supports StorageJoin of type Left Any", ErrorCodes::INCOMPATIBLE_TYPE_OF_JOIN); diff --git a/src/Interpreters/HashJoin.h b/src/Interpreters/HashJoin.h index 67d83d27a6d..025f41ac28f 100644 --- a/src/Interpreters/HashJoin.h +++ b/src/Interpreters/HashJoin.h @@ -162,11 +162,11 @@ public: */ void joinBlock(Block & block, ExtraBlockPtr & not_processed) override; - /// Infer the return type for joinGet function - DataTypePtr joinGetReturnType(const String & column_name, bool or_null) const; + /// Check joinGet arguments and infer the return type. 
+ DataTypePtr joinGetCheckAndGetReturnType(const DataTypes & data_types, const String & column_name, bool or_null) const; - /// Used by joinGet function that turns StorageJoin into a dictionary - void joinGet(Block & block, const String & column_name, bool or_null) const; + /// Used by joinGet function that turns StorageJoin into a dictionary. + ColumnWithTypeAndName joinGet(const Block & block, const Block & block_with_columns_to_add) const; /** Keep "totals" (separate part of dataset, see WITH TOTALS) to use later. */ @@ -383,7 +383,7 @@ private: void joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed) const; template - void joinGetImpl(Block & block, const Block & block_with_columns_to_add, const Maps & maps_) const; + ColumnWithTypeAndName joinGetImpl(const Block & block, const Block & block_with_columns_to_add, const Maps & maps_) const; static Type chooseMethod(const ColumnRawPtrs & key_columns, Sizes & key_sizes); }; diff --git a/src/Interpreters/misc.h b/src/Interpreters/misc.h index 094dfbbbb81..cae2691ca1f 100644 --- a/src/Interpreters/misc.h +++ b/src/Interpreters/misc.h @@ -28,7 +28,7 @@ inline bool functionIsLikeOperator(const std::string & name) inline bool functionIsJoinGet(const std::string & name) { - return name == "joinGet" || startsWith(name, "dictGet"); + return startsWith(name, "joinGet"); } inline bool functionIsDictGet(const std::string & name) diff --git a/tests/queries/0_stateless/01080_join_get_null.reference b/tests/queries/0_stateless/01080_join_get_null.reference index bfde072a796..0cfbf08886f 100644 --- a/tests/queries/0_stateless/01080_join_get_null.reference +++ b/tests/queries/0_stateless/01080_join_get_null.reference @@ -1 +1 @@ -2 2 +2 diff --git a/tests/queries/0_stateless/01080_join_get_null.sql b/tests/queries/0_stateless/01080_join_get_null.sql index 71e7ddf8e75..9f782452d34 100644 --- a/tests/queries/0_stateless/01080_join_get_null.sql +++ b/tests/queries/0_stateless/01080_join_get_null.sql @@ -1,12 +1,12 @@ DROP TABLE IF EXISTS test_joinGet; -DROP TABLE IF EXISTS test_join_joinGet; -CREATE TABLE test_joinGet(id Int32, user_id Nullable(Int32)) Engine = Memory(); -CREATE TABLE test_join_joinGet(user_id Int32, name String) Engine = Join(ANY, LEFT, user_id); +CREATE TABLE test_joinGet(user_id Nullable(Int32), name String) Engine = Join(ANY, LEFT, user_id); -INSERT INTO test_join_joinGet VALUES (2, 'a'), (6, 'b'), (10, 'c'); +INSERT INTO test_joinGet VALUES (2, 'a'), (6, 'b'), (10, 'c'), (null, 'd'); -SELECT 2 id, toNullable(toInt32(2)) user_id WHERE joinGet(test_join_joinGet, 'name', user_id) != ''; +SELECT toNullable(toInt32(2)) user_id WHERE joinGet(test_joinGet, 'name', user_id) != ''; + +-- If the JOIN keys are Nullable fields, the rows where at least one of the keys has the value NULL are not joined. 
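+-- Hence the (null, 'd') row inserted above is never matched: the query below returns no rows,
+-- and the reference file keeps only the single `2` produced by the previous SELECT.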
+SELECT cast(null AS Nullable(Int32)) user_id WHERE joinGet(test_joinGet, 'name', user_id) != ''; DROP TABLE test_joinGet; -DROP TABLE test_join_joinGet; diff --git a/tests/queries/0_stateless/01400_join_get_with_multi_keys.reference b/tests/queries/0_stateless/01400_join_get_with_multi_keys.reference new file mode 100644 index 00000000000..49d59571fbf --- /dev/null +++ b/tests/queries/0_stateless/01400_join_get_with_multi_keys.reference @@ -0,0 +1 @@ +0.1 diff --git a/tests/queries/0_stateless/01400_join_get_with_multi_keys.sql b/tests/queries/0_stateless/01400_join_get_with_multi_keys.sql new file mode 100644 index 00000000000..73068270762 --- /dev/null +++ b/tests/queries/0_stateless/01400_join_get_with_multi_keys.sql @@ -0,0 +1,9 @@ +DROP TABLE IF EXISTS test_joinGet; + +CREATE TABLE test_joinGet(a String, b String, c Float64) ENGINE = Join(any, left, a, b); + +INSERT INTO test_joinGet VALUES ('ab', '1', 0.1), ('ab', '2', 0.2), ('cd', '3', 0.3); + +SELECT joinGet(test_joinGet, 'c', 'ab', '1'); + +DROP TABLE test_joinGet; From 40504f6a6e9b54bdcdb0c63a5724648bf5bc04f5 Mon Sep 17 00:00:00 2001 From: Alexander Kuzmenkov Date: Fri, 31 Jul 2020 17:57:00 +0300 Subject: [PATCH 005/341] Simpler version of #12999 w/o `pos` changes --- programs/client/Client.cpp | 126 +++++++++++++----- ...06_insert_values_and_expressions.reference | 2 + .../00306_insert_values_and_expressions.sql | 9 ++ 3 files changed, 103 insertions(+), 34 deletions(-) diff --git a/programs/client/Client.cpp b/programs/client/Client.cpp index 797342a1b44..78a6d7fe2d9 100644 --- a/programs/client/Client.cpp +++ b/programs/client/Client.cpp @@ -908,74 +908,127 @@ private: return processMultiQuery(text); } - bool processMultiQuery(const String & text) + bool processMultiQuery(const String & all_queries_text) { const bool test_mode = config().has("testmode"); { /// disable logs if expects errors - TestHint test_hint(test_mode, text); + TestHint test_hint(test_mode, all_queries_text); if (test_hint.clientError() || test_hint.serverError()) processTextAsSingleQuery("SET send_logs_level = 'none'"); } /// Several queries separated by ';'. /// INSERT data is ended by the end of line, not ';'. + /// An exception is VALUES format where we also support semicolon in + /// addition to end of line. - const char * begin = text.data(); - const char * end = begin + text.size(); + const char * this_query_begin = all_queries_text.data(); + const char * all_queries_end = all_queries_text.data() + all_queries_text.size(); - while (begin < end) + while (this_query_begin < all_queries_end) { - const char * pos = begin; - ASTPtr orig_ast = parseQuery(pos, end, true); + // Use the token iterator to skip any whitespace, semicolons and + // comments at the beginning of the query. An example from regression + // tests: + // insert into table t values ('invalid'); -- { serverError 469 } + // select 1 + // Here the test hint comment gets parsed as a part of second query. + // We parse the `INSERT VALUES` up to the semicolon, and the rest + // looks like a two-line query: + // -- { serverError 469 } + // select 1 + // and we expect it to fail with error 469, but this hint is actually + // for the previous query. Test hints should go after the query, so + // we can fix this by skipping leading comments. Token iterator skips + // comments and whitespace by itself, so we only have to check for + // semicolons. + // The code block is to limit visibility of `tokens` because we have + // another such variable further down the code, and get warnings for + // that. 
+ { + Tokens tokens(this_query_begin, all_queries_end); + IParser::Pos token_iterator(tokens, + context.getSettingsRef().max_parser_depth); + while (token_iterator->type == TokenType::Semicolon + && token_iterator.isValid()) + { + ++token_iterator; + } + this_query_begin = token_iterator->begin; + if (this_query_begin >= all_queries_end) + { + break; + } + } - if (!orig_ast) + // Try to parse the query. + const char * this_query_end = this_query_begin; + parsed_query = parseQuery(this_query_end, all_queries_end, true); + + if (!parsed_query) { if (ignore_error) { - Tokens tokens(begin, end); + Tokens tokens(this_query_begin, all_queries_end); IParser::Pos token_iterator(tokens, context.getSettingsRef().max_parser_depth); while (token_iterator->type != TokenType::Semicolon && token_iterator.isValid()) ++token_iterator; - begin = token_iterator->end; + this_query_begin = token_iterator->end; continue; } return true; } - auto * insert = orig_ast->as(); - - if (insert && insert->data) + // INSERT queries may have the inserted data in the query text + // that follow the query itself, e.g. "insert into t format CSV 1;2". + // They need special handling. First of all, here we find where the + // inserted data ends. In multy-query mode, it is delimited by a + // newline. + // The VALUES format needs even more handling -- we also allow the + // data to be delimited by semicolon. This case is handled later by + // the format parser itself. + auto * insert_ast = parsed_query->as(); + if (insert_ast && insert_ast->data) { - pos = find_first_symbols<'\n'>(insert->data, end); - insert->end = pos; + this_query_end = find_first_symbols<'\n'>(insert_ast->data, all_queries_end); + insert_ast->end = this_query_end; + query_to_send = all_queries_text.substr( + this_query_begin - all_queries_text.data(), + insert_ast->data - this_query_begin); + } + else + { + query_to_send = all_queries_text.substr( + this_query_begin - all_queries_text.data(), + this_query_end - this_query_begin); } - String str = text.substr(begin - text.data(), pos - begin); + // full_query is the query + inline INSERT data. + full_query = all_queries_text.substr( + this_query_begin - all_queries_text.data(), + this_query_end - this_query_begin); - begin = pos; - while (isWhitespaceASCII(*begin) || *begin == ';') - ++begin; - - TestHint test_hint(test_mode, str); + // Look for the hint in the text of query + insert data, if any. + // e.g. insert into t format CSV 'a' -- { serverError 123 }. + TestHint test_hint(test_mode, full_query); expected_client_error = test_hint.clientError(); expected_server_error = test_hint.serverError(); try { - auto ast_to_process = orig_ast; - if (insert && insert->data) + processParsedSingleQuery(); + + if (insert_ast && insert_ast->data) { - ast_to_process = nullptr; - processTextAsSingleQuery(str); - } - else - { - parsed_query = ast_to_process; - full_query = str; - query_to_send = str; - processParsedSingleQuery(); + // For VALUES format: use the end of inline data as reported + // by the format parser (it is saved in sendData()). This + // allows us to handle queries like: + // insert into t values (1); select 1 + //, where the inline data is delimited by semicolon and not + // by a newline. + this_query_end = parsed_query->as()->end; } } catch (...) 
@@ -983,7 +1036,7 @@ private: last_exception_received_from_server = std::make_unique(getCurrentExceptionMessage(true), getCurrentExceptionCode()); actual_client_error = last_exception_received_from_server->code(); if (!ignore_error && (!actual_client_error || actual_client_error != expected_client_error)) - std::cerr << "Error on processing query: " << str << std::endl << last_exception_received_from_server->message(); + std::cerr << "Error on processing query: " << full_query << std::endl << last_exception_received_from_server->message(); received_exception_from_server = true; } @@ -997,6 +1050,8 @@ private: else return false; } + + this_query_begin = this_query_end; } return true; @@ -1407,7 +1462,7 @@ private: void sendData(Block & sample, const ColumnsDescription & columns_description) { /// If INSERT data must be sent. - const auto * parsed_insert_query = parsed_query->as(); + auto * parsed_insert_query = parsed_query->as(); if (!parsed_insert_query) return; @@ -1416,6 +1471,9 @@ private: /// Send data contained in the query. ReadBufferFromMemory data_in(parsed_insert_query->data, parsed_insert_query->end - parsed_insert_query->data); sendDataFrom(data_in, sample, columns_description); + // Remember where the data ended. We use this info later to determine + // where the next query begins. + parsed_insert_query->end = data_in.buffer().begin() + data_in.count(); } else if (!is_interactive) { diff --git a/tests/queries/0_stateless/00306_insert_values_and_expressions.reference b/tests/queries/0_stateless/00306_insert_values_and_expressions.reference index 960773dc489..e80a28accf4 100644 --- a/tests/queries/0_stateless/00306_insert_values_and_expressions.reference +++ b/tests/queries/0_stateless/00306_insert_values_and_expressions.reference @@ -2,3 +2,5 @@ 2 Hello, world 00000000-0000-0000-0000-000000000000 2016-01-02 2016-01-02 03:04:00 [0,1] 3 hello, world! ab41bdd6-5cd4-11e7-907b-a6006ad3dba0 2016-01-03 2016-01-02 03:00:00 [] 4 World ab41bdd6-5cd4-11e7-907b-a6006ad3dba0 2016-01-04 2016-12-11 10:09:08 [3,2,1] +11111 +1 diff --git a/tests/queries/0_stateless/00306_insert_values_and_expressions.sql b/tests/queries/0_stateless/00306_insert_values_and_expressions.sql index a57e9e69fe6..10a1415f287 100644 --- a/tests/queries/0_stateless/00306_insert_values_and_expressions.sql +++ b/tests/queries/0_stateless/00306_insert_values_and_expressions.sql @@ -5,3 +5,12 @@ INSERT INTO insert VALUES (1, 'Hello', 'ab41bdd6-5cd4-11e7-907b-a6006ad3dba0', ' SELECT * FROM insert ORDER BY i; DROP TABLE insert; + +-- Test the case where the VALUES are delimited by semicolon and a query follows +-- w/o newline. With most formats the query in the same line would be ignored or +-- lead to an error, but VALUES are an exception and support semicolon delimiter, +-- in addition to the newline. +create table if not exists t_306 (a int) engine Memory; +insert into t_306 values (1); select 11111; +select * from t_306; +drop table if exists t_306; From 405a6fb08fa22a9e063dd5e48e7ee6060f718749 Mon Sep 17 00:00:00 2001 From: hexiaoting <“hewenting_ict@163.com”> Date: Mon, 17 Aug 2020 18:20:23 +0800 Subject: [PATCH 006/341] New feature: LineAsString format. 
#13630 --- src/Formats/FormatFactory.cpp | 1 + src/Formats/FormatFactory.h | 1 + .../Impl/LineAsStringRowInputFormat.cpp | 101 ++++++++++++++++++ .../Formats/Impl/LineAsStringRowInputFormat.h | 31 ++++++ src/Processors/ya.make | 1 + 5 files changed, 135 insertions(+) create mode 100644 src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp create mode 100644 src/Processors/Formats/Impl/LineAsStringRowInputFormat.h diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 5256ab2b321..f996e3d8cf2 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -365,6 +365,7 @@ FormatFactory::FormatFactory() registerInputFormatProcessorMsgPack(*this); registerOutputFormatProcessorMsgPack(*this); registerInputFormatProcessorJSONAsString(*this); + registerInputFormatProcessorLineAsString(*this); registerFileSegmentationEngineTabSeparated(*this); registerFileSegmentationEngineCSV(*this); diff --git a/src/Formats/FormatFactory.h b/src/Formats/FormatFactory.h index ea4004c191f..610cf8105b8 100644 --- a/src/Formats/FormatFactory.h +++ b/src/Formats/FormatFactory.h @@ -210,5 +210,6 @@ void registerOutputFormatProcessorPostgreSQLWire(FormatFactory & factory); void registerInputFormatProcessorCapnProto(FormatFactory & factory); void registerInputFormatProcessorRegexp(FormatFactory & factory); void registerInputFormatProcessorJSONAsString(FormatFactory & factory); +void registerInputFormatProcessorLineAsString(FormatFactory & factory); } diff --git a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp new file mode 100644 index 00000000000..a28b3903724 --- /dev/null +++ b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp @@ -0,0 +1,101 @@ +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; + extern const int INCORRECT_DATA; +} + +LineAsStringRowInputFormat::LineAsStringRowInputFormat(const Block & header_, ReadBuffer & in_, Params params_) : + IRowInputFormat(header_, in_, std::move(params_)), buf(in) +{ + if (header_.columns() > 1 || header_.getDataTypes()[0]->getTypeId() != TypeIndex::String) + { + throw Exception("This input format is only suitable for tables with a single column of type String.", ErrorCodes::LOGICAL_ERROR); + } +} + +void LineAsStringRowInputFormat::resetParser() +{ + IRowInputFormat::resetParser(); + buf.reset(); +} + +void LineAsStringRowInputFormat::readLineObject(IColumn & column) +{ + PeekableReadBufferCheckpoint checkpoint{buf}; + size_t balance = 0; + + if (*buf.position() != '"') + throw Exception("Line object must begin with '\"'.", ErrorCodes::INCORRECT_DATA); + + ++buf.position(); + ++balance; + + char * pos; + + while (balance) + { + if (buf.eof()) + throw Exception("Unexpected end of file while parsing Line object.", ErrorCodes::INCORRECT_DATA); + + pos = find_last_symbols_or_null<'"', '\\'>(buf.position(), buf.buffer().end()); + buf.position() = pos; + if (buf.position() == buf.buffer().end()) + continue; + else if (*buf.position() == '"') + { + --balance; + ++buf.position(); + } + else if (*buf.position() == '\\') + { + ++buf.position(); + if (!buf.eof()) + { + ++buf.position(); + } + } + + } + buf.makeContinuousMemoryFromCheckpointToPos(); + char * end = buf.position(); + buf.rollbackToCheckpoint(); + column.insertData(buf.position(), end - buf.position()); + buf.position() = end; +} + +bool LineAsStringRowInputFormat::readRow(MutableColumns & columns, RowReadExtension &) +{ + 
skipWhitespaceIfAny(buf); + + if (!buf.eof()) + readLineObject(*columns[0]); + + skipWhitespaceIfAny(buf); + if (!buf.eof() && *buf.position() == ',') + ++buf.position(); + skipWhitespaceIfAny(buf); + + return !buf.eof(); +} + +void registerInputFormatProcessorLineAsString(FormatFactory & factory) +{ + factory.registerInputFormatProcessor("LineAsString", []( + ReadBuffer & buf, + const Block & sample, + const RowInputFormatParams & params, + const FormatSettings &) + { + return std::make_shared(sample, buf, params); + }); +} + +} diff --git a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.h b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.h new file mode 100644 index 00000000000..a31dce1cc4a --- /dev/null +++ b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.h @@ -0,0 +1,31 @@ +#pragma once + +#include +#include +#include + +namespace DB +{ + +class ReadBuffer; + +/// This format parses a sequence of Line objects separated by newlines, spaces and/or comma. +/// Each Line object is parsed as a whole to string. +/// This format can only parse a table with single field of type String. + +class LineAsStringRowInputFormat : public IRowInputFormat +{ +public: + LineAsStringRowInputFormat(const Block & header_, ReadBuffer & in_, Params params_); + + bool readRow(MutableColumns & columns, RowReadExtension & ext) override; + String getName() const override { return "LineAsStringRowInputFormat"; } + void resetParser() override; + +private: + void readLineObject(IColumn & column); + + PeekableReadBuffer buf; +}; + +} diff --git a/src/Processors/ya.make b/src/Processors/ya.make index 4c25ad5bf3f..081b1d5ba1f 100644 --- a/src/Processors/ya.make +++ b/src/Processors/ya.make @@ -23,6 +23,7 @@ SRCS( Formats/Impl/ConstantExpressionTemplate.cpp Formats/Impl/CSVRowInputFormat.cpp Formats/Impl/CSVRowOutputFormat.cpp + Formats/Impl/LineAsStringRowInputFormat.cpp Formats/Impl/JSONAsStringRowInputFormat.cpp Formats/Impl/JSONCompactEachRowRowInputFormat.cpp Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp From 0451d5729323b7f46d79336fea4f0982bb1662ae Mon Sep 17 00:00:00 2001 From: hexiaoting <“hewenting_ict@163.com”> Date: Tue, 18 Aug 2020 10:35:08 +0800 Subject: [PATCH 007/341] Add new feature: LineAsString Format --- src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp | 6 ++++++ .../0_stateless/01460_line_as_string_format.reference | 1 + tests/queries/0_stateless/01460_line_as_string_format.sql | 5 +++++ 3 files changed, 12 insertions(+) create mode 100644 tests/queries/0_stateless/01460_line_as_string_format.reference create mode 100644 tests/queries/0_stateless/01460_line_as_string_format.sql diff --git a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp index a28b3903724..36844fa700b 100644 --- a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp @@ -32,6 +32,12 @@ void LineAsStringRowInputFormat::readLineObject(IColumn & column) PeekableReadBufferCheckpoint checkpoint{buf}; size_t balance = 0; + if (*buf.position() == ';') { + ++buf.position(); + if(buf.eof()) + return; + } + if (*buf.position() != '"') throw Exception("Line object must begin with '\"'.", ErrorCodes::INCORRECT_DATA); diff --git a/tests/queries/0_stateless/01460_line_as_string_format.reference b/tests/queries/0_stateless/01460_line_as_string_format.reference new file mode 100644 index 00000000000..989f8ac0292 --- /dev/null +++ 
b/tests/queries/0_stateless/01460_line_as_string_format.reference @@ -0,0 +1 @@ +"I love apple","I love banana","I love pear" diff --git a/tests/queries/0_stateless/01460_line_as_string_format.sql b/tests/queries/0_stateless/01460_line_as_string_format.sql new file mode 100644 index 00000000000..e5518a828d0 --- /dev/null +++ b/tests/queries/0_stateless/01460_line_as_string_format.sql @@ -0,0 +1,5 @@ +DROP TABLE IF EXISTS line_as_string; +CREATE TABLE line_as_string (field String) ENGINE = Memory; +INSERT INTO line_as_string FORMAT LineAsString "I love apple","I love banana","I love pear"; +SELECT * FROM line_as_string; +DROP TABLE line_as_string; From e9be2f14ea8ac45f11c7c65b6c36646b64a5b390 Mon Sep 17 00:00:00 2001 From: hexiaoting <“hewenting_ict@163.com”> Date: Wed, 19 Aug 2020 11:50:43 +0800 Subject: [PATCH 008/341] fix implementation for \n separated lines --- .../Impl/LineAsStringRowInputFormat.cpp | 45 ++++++------------- .../01460_line_as_string_format.reference | 7 ++- .../01460_line_as_string_format.sh | 19 ++++++++ .../01460_line_as_string_format.sql | 5 --- 4 files changed, 38 insertions(+), 38 deletions(-) create mode 100755 tests/queries/0_stateless/01460_line_as_string_format.sh delete mode 100644 tests/queries/0_stateless/01460_line_as_string_format.sql diff --git a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp index 36844fa700b..27bc71d764d 100644 --- a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp @@ -30,35 +30,22 @@ void LineAsStringRowInputFormat::resetParser() void LineAsStringRowInputFormat::readLineObject(IColumn & column) { PeekableReadBufferCheckpoint checkpoint{buf}; - size_t balance = 0; - - if (*buf.position() == ';') { - ++buf.position(); - if(buf.eof()) - return; - } - - if (*buf.position() != '"') - throw Exception("Line object must begin with '\"'.", ErrorCodes::INCORRECT_DATA); - - ++buf.position(); - ++balance; + bool newline = true; + bool over = false; char * pos; - while (balance) + while (newline) { - if (buf.eof()) - throw Exception("Unexpected end of file while parsing Line object.", ErrorCodes::INCORRECT_DATA); - - pos = find_last_symbols_or_null<'"', '\\'>(buf.position(), buf.buffer().end()); + pos = find_first_symbols<'\n', '\\'>(buf.position(), buf.buffer().end()); buf.position() = pos; - if (buf.position() == buf.buffer().end()) - continue; - else if (*buf.position() == '"') + if (buf.position() == buf.buffer().end()) { + over = true; + break; + } + else if (*buf.position() == '\n') { - --balance; - ++buf.position(); + newline = false; } else if (*buf.position() == '\\') { @@ -70,25 +57,19 @@ void LineAsStringRowInputFormat::readLineObject(IColumn & column) } } + buf.makeContinuousMemoryFromCheckpointToPos(); - char * end = buf.position(); + char * end = over ? buf.position(): ++buf.position(); buf.rollbackToCheckpoint(); - column.insertData(buf.position(), end - buf.position()); + column.insertData(buf.position(), end - (over ? 
0 : 1) - buf.position()); buf.position() = end; } bool LineAsStringRowInputFormat::readRow(MutableColumns & columns, RowReadExtension &) { - skipWhitespaceIfAny(buf); - if (!buf.eof()) readLineObject(*columns[0]); - skipWhitespaceIfAny(buf); - if (!buf.eof() && *buf.position() == ',') - ++buf.position(); - skipWhitespaceIfAny(buf); - return !buf.eof(); } diff --git a/tests/queries/0_stateless/01460_line_as_string_format.reference b/tests/queries/0_stateless/01460_line_as_string_format.reference index 989f8ac0292..dec67eb2e0a 100644 --- a/tests/queries/0_stateless/01460_line_as_string_format.reference +++ b/tests/queries/0_stateless/01460_line_as_string_format.reference @@ -1 +1,6 @@ -"I love apple","I love banana","I love pear" +"id" : 1, +"date" : "01.01.2020", +"string" : "123{{{\\"\\\\", +"array" : [1, 2, 3], + +Finally implement this new feature. diff --git a/tests/queries/0_stateless/01460_line_as_string_format.sh b/tests/queries/0_stateless/01460_line_as_string_format.sh new file mode 100755 index 00000000000..a985bc207a8 --- /dev/null +++ b/tests/queries/0_stateless/01460_line_as_string_format.sh @@ -0,0 +1,19 @@ +#!/usr/bin/env bash + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +. "$CURDIR"/../shell_config.sh + +$CLICKHOUSE_CLIENT --query="DROP TABLE IF EXISTS line_as_string"; + +$CLICKHOUSE_CLIENT --query="CREATE TABLE line_as_string(field String) ENGINE = Memory"; + +echo '"id" : 1, +"date" : "01.01.2020", +"string" : "123{{{\"\\", +"array" : [1, 2, 3], + +Finally implement this new feature.' | $CLICKHOUSE_CLIENT --query="INSERT INTO line_as_string FORMAT LineAsString"; + +$CLICKHOUSE_CLIENT --query="SELECT * FROM line_as_string"; +$CLICKHOUSE_CLIENT --query="DROP TABLE line_as_string" + diff --git a/tests/queries/0_stateless/01460_line_as_string_format.sql b/tests/queries/0_stateless/01460_line_as_string_format.sql deleted file mode 100644 index e5518a828d0..00000000000 --- a/tests/queries/0_stateless/01460_line_as_string_format.sql +++ /dev/null @@ -1,5 +0,0 @@ -DROP TABLE IF EXISTS line_as_string; -CREATE TABLE line_as_string (field String) ENGINE = Memory; -INSERT INTO line_as_string FORMAT LineAsString "I love apple","I love banana","I love pear"; -SELECT * FROM line_as_string; -DROP TABLE line_as_string; From 4331158d3051437f44c7fa1271e4673272cf8cac Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Mon, 24 Aug 2020 16:09:23 +0300 Subject: [PATCH 009/341] merge with master --- src/Disks/DiskDecorator.cpp | 15 +++++++++++++++ src/Disks/DiskDecorator.h | 3 +++ .../MergeTree/MergeTreeDataPartWriterInMemory.cpp | 2 +- .../MergeTree/MergeTreeDataPartWriterInMemory.h | 2 +- src/Storages/MergeTree/MergeTreeDataWriter.cpp | 11 ++++++----- 5 files changed, 26 insertions(+), 7 deletions(-) diff --git a/src/Disks/DiskDecorator.cpp b/src/Disks/DiskDecorator.cpp index e55534e347f..7f2ea58d7cf 100644 --- a/src/Disks/DiskDecorator.cpp +++ b/src/Disks/DiskDecorator.cpp @@ -165,4 +165,19 @@ void DiskDecorator::truncateFile(const String & path, size_t size) delegate->truncateFile(path, size); } +int DiskDecorator::open(const String & path, mode_t mode) const +{ + return delegate->open(path, mode); +} + +void DiskDecorator::close(int fd) const +{ + delegate->close(fd); +} + +void DiskDecorator::sync(int fd) const +{ + delegate->sync(fd); +} + } diff --git a/src/Disks/DiskDecorator.h b/src/Disks/DiskDecorator.h index 71bb100c576..f1ddfff4952 100644 --- a/src/Disks/DiskDecorator.h +++ b/src/Disks/DiskDecorator.h @@ -42,6 +42,9 @@ public: void setReadOnly(const String & path) override; 
void createHardLink(const String & src_path, const String & dst_path) override; void truncateFile(const String & path, size_t size) override; + int open(const String & path, mode_t mode) const override; + void close(int fd) const override; + void sync(int fd) const override; const String getType() const override { return delegate->getType(); } protected: diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp index a7486158737..f0738a1130a 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp @@ -70,7 +70,7 @@ void MergeTreeDataPartWriterInMemory::calculateAndSerializePrimaryIndex(const Bl } } -void MergeTreeDataPartWriterInMemory::finishDataSerialization(IMergeTreeDataPart::Checksums & checksums) +void MergeTreeDataPartWriterInMemory::finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool) { /// If part is empty we still need to initialize block by empty columns. if (!part_in_memory->block) diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h index 92e4228a90d..6e59cdd08a9 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h @@ -18,7 +18,7 @@ public: void write(const Block & block, const IColumn::Permutation * permutation, const Block & primary_key_block, const Block & skip_indexes_block) override; - void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums) override; + void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool sync) override; void calculateAndSerializePrimaryIndex(const Block & primary_index_block) override; diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp index f3a72657be5..b05b970da3b 100644 --- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp +++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp @@ -251,6 +251,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(BlockWithPa new_data_part->minmax_idx = std::move(minmax_idx); new_data_part->is_temp = true; + std::optional sync_guard; if (new_data_part->isStoredOnDisk()) { /// The name could be non-unique in case of stale files from previous runs. @@ -262,12 +263,12 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(BlockWithPa new_data_part->volume->getDisk()->removeRecursive(full_path); } - const auto disk = new_data_part->volume->getDisk(); - disk->createDirectories(full_path); + const auto disk = new_data_part->volume->getDisk(); + disk->createDirectories(full_path); - std::optional sync_guard; - if (data.getSettings()->fsync_part_directory) - sync_guard.emplace(disk, full_path); + if (data.getSettings()->fsync_part_directory) + sync_guard.emplace(disk, full_path); + } /// If we need to calculate some columns to sort. 
if (metadata_snapshot->hasSortingKey() || metadata_snapshot->hasSecondaryIndices()) From 25140b9bd5b6421b84ef8586827cc49b9d015e7b Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 1 Sep 2020 04:39:36 +0300 Subject: [PATCH 010/341] fsync MergeTree format file --- src/Storages/MergeTree/MergeTreeData.cpp | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index bbefba70c58..bc668659b6a 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -220,6 +220,8 @@ MergeTreeData::MergeTreeData( format_version = min_format_version; auto buf = version_file.second->writeFile(version_file.first); writeIntText(format_version.toUnderType(), *buf); + if (global_context.getSettingsRef().fsync_metadata) + buf->sync(); } else { From 927eb32e882d070ff5ff5446d5b9e0071e2c6f9d Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 1 Sep 2020 04:46:40 +0300 Subject: [PATCH 011/341] add test for durability (draft) --- utils/durability-test/create.sql | 1 + utils/durability-test/durability-test.sh | 154 +++++++++++++++++++++++ utils/durability-test/insert.sql | 1 + utils/durability-test/install.sh | 3 + utils/durability-test/sshd_config | 8 ++ utils/durability-test/startup.exp | 23 ++++ 6 files changed, 190 insertions(+) create mode 100644 utils/durability-test/create.sql create mode 100644 utils/durability-test/durability-test.sh create mode 100644 utils/durability-test/insert.sql create mode 100644 utils/durability-test/install.sh create mode 100644 utils/durability-test/sshd_config create mode 100755 utils/durability-test/startup.exp diff --git a/utils/durability-test/create.sql b/utils/durability-test/create.sql new file mode 100644 index 00000000000..1ec394100e2 --- /dev/null +++ b/utils/durability-test/create.sql @@ -0,0 +1 @@ +CREATE TABLE test (a Int, s String) ENGINE = MergeTree ORDER BY a; diff --git a/utils/durability-test/durability-test.sh b/utils/durability-test/durability-test.sh new file mode 100644 index 00000000000..1f47c900f49 --- /dev/null +++ b/utils/durability-test/durability-test.sh @@ -0,0 +1,154 @@ +#!/bin/bash + +URL=http://cloud-images.ubuntu.com/bionic/current +IMAGE=bionic-server-cloudimg-amd64.img +SSH_PORT=11022 +CLICKHOUSE_PORT=9090 +PASSWORD=root + +TABLE_NAME=$1 +CREATE_QUERY=$2 +INSERT_QUERY=$3 + +if [[ -z $TABLE_NAME || -z $CREATE_QUERY || -z $INSERT_QUERY ]]; then + echo "Required 3 arguments: table name, file with create query, file with insert query" + exit 1 +fi + +function run() +{ + sshpass -p $PASSWORD ssh -p $SSH_PORT root@localhost "$1" +} + +function copy() +{ + sshpass -p $PASSWORD scp -r -P $SSH_PORT $1 root@localhost:$2 +} + +function wait_vm_for_start() +{ + echo "Waiting until VM started..." + started=0 + for i in {0..100}; do + run "exit" + if [ $? -eq 0 ]; then + started=1 + break + fi + sleep 1s + done + + if ((started == 0)); then + echo "Can't start or connect to VM." + exit 1 + fi + + echo "Started VM" +} + +function wait_clickhouse_for_start() +{ + echo "Waiting until ClickHouse started..." + started=0 + for i in {0..15}; do + run "clickhouse client --query 'select 1'" + if [ $? -eq 0 ]; then + started=1 + break + fi + sleep 1s + done + + if ((started == 0)); then + echo "Can't start ClickHouse." 
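+        # Assumption: mirror wait_vm_for_start and abort here, since the steps below need a running server.
+        exit 1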
+ fi + + echo "Started ClickHouse" +} + +echo "Downloading image" +curl -O $URL/$IMAGE + +qemu-img resize $IMAGE +10G +virt-customize -a $IMAGE --root-password password:$PASSWORD +virt-copy-in -a $IMAGE sshd_config /etc/ssh + +echo "Starting VM" + +chmod +x ./startup.exp +./startup.exp > qemu.log 2>&1 & + +wait_vm_for_start + +echo "Preparing VM" + +# Resize partition +run "growpart /dev/sda 1 && resize2fs /dev/sda1" + +if [[ -z $CLICKHOUSE_BINARY ]]; then + CLICKHOUSE_BINARY=/usr/bin/clickhouse +fi + +if [[ -z $CLICKHOUSE_CONFIG_DIR ]]; then + CLICKHOUSE_CONFIG_DIR=/etc/clickhouse-server +fi + +echo "Using ClickHouse binary: " $CLICKHOUSE_BINARY +echo "Using ClickHouse config from: " $CLICKHOUSE_CONFIG_DIR + +copy $CLICKHOUSE_BINARY /usr/bin +copy $CLICKHOUSE_CONFIG_DIR /etc +run "mv /etc/$CLICKHOUSE_CONFIG_DIR /etc/clickhouse-server" + +echo "Prepared VM" +echo "Starting ClickHouse" + +run "clickhouse server --config-file=/etc/clickhouse-server/config.xml > clickhouse-server.log 2>&1" & + +wait_clickhouse_for_start + +echo "Started ClickHouse" + +query=`cat $CREATE_QUERY` +echo "Executing query:" $query +run "clickhouse client --query '$query'" + +query=`cat $INSERT_QUERY` +echo "Will run in a loop query: " $query +run "clickhouse benchmark <<< '$query'" & +echo "Running queries" + +pid=`pidof qemu-system-x86_64` +sec=$(( (RANDOM % 3) + 25 )) + +ms=$(( RANDOM % 1000 )) + +echo "Will kill VM in $sec.$ms sec" + +sleep $sec.$ms +kill -9 $pid + +echo "Restarting" + +./startup.exp > qemu.log 2>&1 & +wait_vm_for_start + +run "rm -r *data/system" +run "clickhouse server --config-file=/etc/clickhouse-server/config.xml > clickhouse-server.log 2>&1" & +wait_clickhouse_for_start + +result=`run "grep $TABLE_NAME clickhouse-server.log | grep 'Caught exception while loading metadata'"` +if [[ -n $result ]]; then + echo "FAIL. Can't attach table:" + echo $result + exit 1 +fi + +result=`run "grep $TABLE_NAME clickhouse-server.log | grep 'Considering to remove broken part'"` +if [[ -n $result ]]; then + echo "FAIL. 
Have broken parts:" + echo $result + exit 1 +fi + +echo OK diff --git a/utils/durability-test/insert.sql b/utils/durability-test/insert.sql new file mode 100644 index 00000000000..8982ad47228 --- /dev/null +++ b/utils/durability-test/insert.sql @@ -0,0 +1 @@ +INSERT INTO test SELECT number, toString(number) FROM numbers(10) diff --git a/utils/durability-test/install.sh b/utils/durability-test/install.sh new file mode 100644 index 00000000000..526cde6743f --- /dev/null +++ b/utils/durability-test/install.sh @@ -0,0 +1,3 @@ +#!/bin/bash + +apt update && apt install qemu-kvm qemu virt-manager virt-viewer libguestfs-tools sshpass expect diff --git a/utils/durability-test/sshd_config b/utils/durability-test/sshd_config new file mode 100644 index 00000000000..6ed06d3d8ad --- /dev/null +++ b/utils/durability-test/sshd_config @@ -0,0 +1,8 @@ +PermitRootLogin yes +PasswordAuthentication yes +ChallengeResponseAuthentication no +UsePAM yes +X11Forwarding yes +PrintMotd no +AcceptEnv LANG LC_* +Subsystem sftp /usr/lib/openssh/sftp-server diff --git a/utils/durability-test/startup.exp b/utils/durability-test/startup.exp new file mode 100755 index 00000000000..540cfc0e4b8 --- /dev/null +++ b/utils/durability-test/startup.exp @@ -0,0 +1,23 @@ +#!/usr/bin/expect -f + +# Wait enough (forever) until a long-time boot +set timeout -1 + +spawn qemu-system-x86_64 \ + -hda bionic-server-cloudimg-amd64.img \ + -cpu qemu64,+ssse3,+sse4.1,+sse4.2,+popcnt -smp 8 \ + -net nic -net user,hostfwd=tcp::11022-:22 \ + -m 4096 -nographic + +expect "login: " +send "root\n" + +expect "Password: " +send "root\n" + +# Without it ssh is not working on guest machine for some reason +expect "# " +send "dhclient && ssh-keygen -A && systemctl restart sshd.service\n" + +# Wait forever +expect "########" From 602535396d0ac58c1885ef1d1d3e7c085335f059 Mon Sep 17 00:00:00 2001 From: hcz Date: Tue, 1 Sep 2020 16:36:27 +0800 Subject: [PATCH 012/341] Refactor, move function declarations --- src/Formats/FormatFactory.cpp | 100 +++++++++++++++++++++++++++++----- src/Formats/FormatFactory.h | 69 ----------------------- 2 files changed, 85 insertions(+), 84 deletions(-) diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 935d31d6541..871098e00c0 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -323,13 +323,85 @@ void FormatFactory::registerFileSegmentationEngine(const String & name, FileSegm target = std::move(file_segmentation_engine); } +/// File Segmentation Engines for parallel reading + +void registerFileSegmentationEngineTabSeparated(FormatFactory & factory); +void registerFileSegmentationEngineCSV(FormatFactory & factory); +void registerFileSegmentationEngineJSONEachRow(FormatFactory & factory); +void registerFileSegmentationEngineRegexp(FormatFactory & factory); +void registerFileSegmentationEngineJSONAsString(FormatFactory & factory); + +/// Formats for both input/output. 
+ +void registerInputFormatNative(FormatFactory & factory); +void registerOutputFormatNative(FormatFactory & factory); + +void registerInputFormatProcessorNative(FormatFactory & factory); +void registerOutputFormatProcessorNative(FormatFactory & factory); +void registerInputFormatProcessorRowBinary(FormatFactory & factory); +void registerOutputFormatProcessorRowBinary(FormatFactory & factory); +void registerInputFormatProcessorTabSeparated(FormatFactory & factory); +void registerOutputFormatProcessorTabSeparated(FormatFactory & factory); +void registerInputFormatProcessorValues(FormatFactory & factory); +void registerOutputFormatProcessorValues(FormatFactory & factory); +void registerInputFormatProcessorCSV(FormatFactory & factory); +void registerOutputFormatProcessorCSV(FormatFactory & factory); +void registerInputFormatProcessorTSKV(FormatFactory & factory); +void registerOutputFormatProcessorTSKV(FormatFactory & factory); +void registerInputFormatProcessorJSONEachRow(FormatFactory & factory); +void registerOutputFormatProcessorJSONEachRow(FormatFactory & factory); +void registerInputFormatProcessorJSONCompactEachRow(FormatFactory & factory); +void registerOutputFormatProcessorJSONCompactEachRow(FormatFactory & factory); +void registerInputFormatProcessorProtobuf(FormatFactory & factory); +void registerOutputFormatProcessorProtobuf(FormatFactory & factory); +void registerInputFormatProcessorTemplate(FormatFactory & factory); +void registerOutputFormatProcessorTemplate(FormatFactory & factory); +void registerInputFormatProcessorMsgPack(FormatFactory & factory); +void registerOutputFormatProcessorMsgPack(FormatFactory & factory); +void registerInputFormatProcessorORC(FormatFactory & factory); +void registerOutputFormatProcessorORC(FormatFactory & factory); +void registerInputFormatProcessorParquet(FormatFactory & factory); +void registerOutputFormatProcessorParquet(FormatFactory & factory); +void registerInputFormatProcessorArrow(FormatFactory & factory); +void registerOutputFormatProcessorArrow(FormatFactory & factory); +void registerInputFormatProcessorAvro(FormatFactory & factory); +void registerOutputFormatProcessorAvro(FormatFactory & factory); + +/// Output only (presentational) formats. + +void registerOutputFormatNull(FormatFactory & factory); + +void registerOutputFormatProcessorPretty(FormatFactory & factory); +void registerOutputFormatProcessorPrettyCompact(FormatFactory & factory); +void registerOutputFormatProcessorPrettySpace(FormatFactory & factory); +void registerOutputFormatProcessorVertical(FormatFactory & factory); +void registerOutputFormatProcessorJSON(FormatFactory & factory); +void registerOutputFormatProcessorJSONCompact(FormatFactory & factory); +void registerOutputFormatProcessorJSONEachRowWithProgress(FormatFactory & factory); +void registerOutputFormatProcessorXML(FormatFactory & factory); +void registerOutputFormatProcessorODBCDriver2(FormatFactory & factory); +void registerOutputFormatProcessorNull(FormatFactory & factory); +void registerOutputFormatProcessorMySQLWire(FormatFactory & factory); +void registerOutputFormatProcessorMarkdown(FormatFactory & factory); +void registerOutputFormatProcessorPostgreSQLWire(FormatFactory & factory); + +/// Input only formats. 
+ +void registerInputFormatProcessorRegexp(FormatFactory & factory); +void registerInputFormatProcessorJSONAsString(FormatFactory & factory); +void registerInputFormatProcessorCapnProto(FormatFactory & factory); + FormatFactory::FormatFactory() { + registerFileSegmentationEngineTabSeparated(*this); + registerFileSegmentationEngineCSV(*this); + registerFileSegmentationEngineJSONEachRow(*this); + registerFileSegmentationEngineRegexp(*this); + registerFileSegmentationEngineJSONAsString(*this); + registerInputFormatNative(*this); registerOutputFormatNative(*this); - registerOutputFormatProcessorJSONEachRowWithProgress(*this); - registerInputFormatProcessorNative(*this); registerOutputFormatProcessorNative(*this); registerInputFormatProcessorRowBinary(*this); @@ -348,8 +420,11 @@ FormatFactory::FormatFactory() registerOutputFormatProcessorJSONCompactEachRow(*this); registerInputFormatProcessorProtobuf(*this); registerOutputFormatProcessorProtobuf(*this); + registerInputFormatProcessorTemplate(*this); + registerOutputFormatProcessorTemplate(*this); + registerInputFormatProcessorMsgPack(*this); + registerOutputFormatProcessorMsgPack(*this); #if !defined(ARCADIA_BUILD) - registerInputFormatProcessorCapnProto(*this); registerInputFormatProcessorORC(*this); registerOutputFormatProcessorORC(*this); registerInputFormatProcessorParquet(*this); @@ -359,18 +434,6 @@ FormatFactory::FormatFactory() registerInputFormatProcessorAvro(*this); registerOutputFormatProcessorAvro(*this); #endif - registerInputFormatProcessorTemplate(*this); - registerOutputFormatProcessorTemplate(*this); - registerInputFormatProcessorRegexp(*this); - registerInputFormatProcessorMsgPack(*this); - registerOutputFormatProcessorMsgPack(*this); - registerInputFormatProcessorJSONAsString(*this); - - registerFileSegmentationEngineTabSeparated(*this); - registerFileSegmentationEngineCSV(*this); - registerFileSegmentationEngineJSONEachRow(*this); - registerFileSegmentationEngineRegexp(*this); - registerFileSegmentationEngineJSONAsString(*this); registerOutputFormatNull(*this); @@ -380,12 +443,19 @@ FormatFactory::FormatFactory() registerOutputFormatProcessorVertical(*this); registerOutputFormatProcessorJSON(*this); registerOutputFormatProcessorJSONCompact(*this); + registerOutputFormatProcessorJSONEachRowWithProgress(*this); registerOutputFormatProcessorXML(*this); registerOutputFormatProcessorODBCDriver2(*this); registerOutputFormatProcessorNull(*this); registerOutputFormatProcessorMySQLWire(*this); registerOutputFormatProcessorMarkdown(*this); registerOutputFormatProcessorPostgreSQLWire(*this); + + registerInputFormatProcessorRegexp(*this); + registerInputFormatProcessorJSONAsString(*this); +#if !defined(ARCADIA_BUILD) + registerInputFormatProcessorCapnProto(*this); +#endif } FormatFactory & FormatFactory::instance() diff --git a/src/Formats/FormatFactory.h b/src/Formats/FormatFactory.h index f0d2b7826a0..54bff1eefc6 100644 --- a/src/Formats/FormatFactory.h +++ b/src/Formats/FormatFactory.h @@ -141,73 +141,4 @@ private: const Creators & getCreators(const String & name) const; }; -/// Formats for both input/output. 
- -void registerInputFormatNative(FormatFactory & factory); -void registerOutputFormatNative(FormatFactory & factory); - -void registerInputFormatProcessorNative(FormatFactory & factory); -void registerOutputFormatProcessorNative(FormatFactory & factory); -void registerInputFormatProcessorRowBinary(FormatFactory & factory); -void registerOutputFormatProcessorRowBinary(FormatFactory & factory); -void registerInputFormatProcessorTabSeparated(FormatFactory & factory); -void registerOutputFormatProcessorTabSeparated(FormatFactory & factory); -void registerInputFormatProcessorValues(FormatFactory & factory); -void registerOutputFormatProcessorValues(FormatFactory & factory); -void registerInputFormatProcessorCSV(FormatFactory & factory); -void registerOutputFormatProcessorCSV(FormatFactory & factory); -void registerInputFormatProcessorTSKV(FormatFactory & factory); -void registerOutputFormatProcessorTSKV(FormatFactory & factory); -void registerInputFormatProcessorJSONEachRow(FormatFactory & factory); -void registerOutputFormatProcessorJSONEachRow(FormatFactory & factory); -void registerInputFormatProcessorJSONCompactEachRow(FormatFactory & factory); -void registerOutputFormatProcessorJSONCompactEachRow(FormatFactory & factory); -void registerInputFormatProcessorParquet(FormatFactory & factory); -void registerOutputFormatProcessorParquet(FormatFactory & factory); -void registerInputFormatProcessorArrow(FormatFactory & factory); -void registerOutputFormatProcessorArrow(FormatFactory & factory); -void registerInputFormatProcessorProtobuf(FormatFactory & factory); -void registerOutputFormatProcessorProtobuf(FormatFactory & factory); -void registerInputFormatProcessorAvro(FormatFactory & factory); -void registerOutputFormatProcessorAvro(FormatFactory & factory); -void registerInputFormatProcessorTemplate(FormatFactory & factory); -void registerOutputFormatProcessorTemplate(FormatFactory & factory); -void registerInputFormatProcessorMsgPack(FormatFactory & factory); -void registerOutputFormatProcessorMsgPack(FormatFactory & factory); -void registerInputFormatProcessorORC(FormatFactory & factory); -void registerOutputFormatProcessorORC(FormatFactory & factory); - - -/// File Segmentation Engines for parallel reading - -void registerFileSegmentationEngineTabSeparated(FormatFactory & factory); -void registerFileSegmentationEngineCSV(FormatFactory & factory); -void registerFileSegmentationEngineJSONEachRow(FormatFactory & factory); -void registerFileSegmentationEngineRegexp(FormatFactory & factory); -void registerFileSegmentationEngineJSONAsString(FormatFactory & factory); - -/// Output only (presentational) formats. 
- -void registerOutputFormatNull(FormatFactory & factory); - -void registerOutputFormatProcessorPretty(FormatFactory & factory); -void registerOutputFormatProcessorPrettyCompact(FormatFactory & factory); -void registerOutputFormatProcessorPrettySpace(FormatFactory & factory); -void registerOutputFormatProcessorPrettyASCII(FormatFactory & factory); -void registerOutputFormatProcessorVertical(FormatFactory & factory); -void registerOutputFormatProcessorJSON(FormatFactory & factory); -void registerOutputFormatProcessorJSONCompact(FormatFactory & factory); -void registerOutputFormatProcessorJSONEachRowWithProgress(FormatFactory & factory); -void registerOutputFormatProcessorXML(FormatFactory & factory); -void registerOutputFormatProcessorODBCDriver2(FormatFactory & factory); -void registerOutputFormatProcessorNull(FormatFactory & factory); -void registerOutputFormatProcessorMySQLWire(FormatFactory & factory); -void registerOutputFormatProcessorMarkdown(FormatFactory & factory); -void registerOutputFormatProcessorPostgreSQLWire(FormatFactory & factory); - -/// Input only formats. -void registerInputFormatProcessorCapnProto(FormatFactory & factory); -void registerInputFormatProcessorRegexp(FormatFactory & factory); -void registerInputFormatProcessorJSONAsString(FormatFactory & factory); - } From 86fa185bb6fbf8e1e6bc6044a7f4e523477e84db Mon Sep 17 00:00:00 2001 From: hcz Date: Tue, 1 Sep 2020 17:06:28 +0800 Subject: [PATCH 013/341] Add JSONStrings formats --- src/Formats/FormatFactory.cpp | 6 + .../Impl/JSONStringsEachRowRowInputFormat.cpp | 245 ++++++++++++++++++ .../Impl/JSONStringsEachRowRowInputFormat.h | 54 ++++ .../JSONStringsEachRowRowOutputFormat.cpp | 117 +++++++++ .../Impl/JSONStringsEachRowRowOutputFormat.h | 45 ++++ .../Impl/JSONStringsRowOutputFormat.cpp | 93 +++++++ .../Formats/Impl/JSONStringsRowOutputFormat.h | 43 +++ src/Processors/ya.make | 3 + 8 files changed, 606 insertions(+) create mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp create mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h create mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp create mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h create mode 100644 src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp create mode 100644 src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 871098e00c0..cb378fbea96 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -352,6 +352,8 @@ void registerInputFormatProcessorJSONEachRow(FormatFactory & factory); void registerOutputFormatProcessorJSONEachRow(FormatFactory & factory); void registerInputFormatProcessorJSONCompactEachRow(FormatFactory & factory); void registerOutputFormatProcessorJSONCompactEachRow(FormatFactory & factory); +void registerInputFormatProcessorJSONStringsEachRow(FormatFactory & factory); +void registerOutputFormatProcessorJSONStringsEachRow(FormatFactory & factory); void registerInputFormatProcessorProtobuf(FormatFactory & factory); void registerOutputFormatProcessorProtobuf(FormatFactory & factory); void registerInputFormatProcessorTemplate(FormatFactory & factory); @@ -378,6 +380,7 @@ void registerOutputFormatProcessorVertical(FormatFactory & factory); void registerOutputFormatProcessorJSON(FormatFactory & factory); void registerOutputFormatProcessorJSONCompact(FormatFactory & factory); void 
registerOutputFormatProcessorJSONEachRowWithProgress(FormatFactory & factory); +void registerOutputFormatProcessorJSONStrings(FormatFactory & factory); void registerOutputFormatProcessorXML(FormatFactory & factory); void registerOutputFormatProcessorODBCDriver2(FormatFactory & factory); void registerOutputFormatProcessorNull(FormatFactory & factory); @@ -418,6 +421,8 @@ FormatFactory::FormatFactory() registerOutputFormatProcessorJSONEachRow(*this); registerInputFormatProcessorJSONCompactEachRow(*this); registerOutputFormatProcessorJSONCompactEachRow(*this); + registerInputFormatProcessorJSONStringsEachRow(*this); + registerOutputFormatProcessorJSONStringsEachRow(*this); registerInputFormatProcessorProtobuf(*this); registerOutputFormatProcessorProtobuf(*this); registerInputFormatProcessorTemplate(*this); @@ -444,6 +449,7 @@ FormatFactory::FormatFactory() registerOutputFormatProcessorJSON(*this); registerOutputFormatProcessorJSONCompact(*this); registerOutputFormatProcessorJSONEachRowWithProgress(*this); + registerOutputFormatProcessorJSONStrings(*this); registerOutputFormatProcessorXML(*this); registerOutputFormatProcessorODBCDriver2(*this); registerOutputFormatProcessorNull(*this); diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp new file mode 100644 index 00000000000..fff44a204fb --- /dev/null +++ b/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp @@ -0,0 +1,245 @@ +#include +#include + +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int INCORRECT_DATA; + extern const int CANNOT_READ_ALL_DATA; +} + + +JSONStringsEachRowRowInputFormat::JSONStringsEachRowRowInputFormat(ReadBuffer & in_, + const Block & header_, + Params params_, + const FormatSettings & format_settings_, + bool with_names_) + : IRowInputFormat(header_, in_, std::move(params_)), format_settings(format_settings_), with_names(with_names_) +{ + const auto & sample = getPort().getHeader(); + size_t num_columns = sample.columns(); + + data_types.resize(num_columns); + column_indexes_by_names.reserve(num_columns); + + for (size_t i = 0; i < num_columns; ++i) + { + const auto & column_info = sample.getByPosition(i); + + data_types[i] = column_info.type; + column_indexes_by_names.emplace(column_info.name, i); + } +} + +void JSONStringsEachRowRowInputFormat::resetParser() +{ + IRowInputFormat::resetParser(); + column_indexes_for_input_fields.clear(); + not_seen_columns.clear(); +} + +void JSONStringsEachRowRowInputFormat::readPrefix() +{ + /// In this format, BOM at beginning of stream cannot be confused with value, so it is safe to skip it. 
+ skipBOMIfExists(in); + + if (with_names) + { + size_t num_columns = getPort().getHeader().columns(); + read_columns.assign(num_columns, false); + + assertChar('[', in); + do + { + skipWhitespaceIfAny(in); + String column_name; + readJSONString(column_name, in); + addInputColumn(column_name); + skipWhitespaceIfAny(in); + } + while (checkChar(',', in)); + assertChar(']', in); + skipEndOfLine(); + + /// Type checking + assertChar('[', in); + for (size_t i = 0; i < column_indexes_for_input_fields.size(); ++i) + { + skipWhitespaceIfAny(in); + String data_type; + readJSONString(data_type, in); + + if (column_indexes_for_input_fields[i] && + data_types[*column_indexes_for_input_fields[i]]->getName() != data_type) + { + throw Exception( + "Type of '" + getPort().getHeader().getByPosition(*column_indexes_for_input_fields[i]).name + + "' must be " + data_types[*column_indexes_for_input_fields[i]]->getName() + + ", not " + data_type, + ErrorCodes::INCORRECT_DATA + ); + } + + if (i != column_indexes_for_input_fields.size() - 1) + assertChar(',', in); + skipWhitespaceIfAny(in); + } + assertChar(']', in); + } + else + { + size_t num_columns = getPort().getHeader().columns(); + read_columns.assign(num_columns, true); + column_indexes_for_input_fields.resize(num_columns); + + for (size_t i = 0; i < num_columns; ++i) + { + column_indexes_for_input_fields[i] = i; + } + } + + for (size_t i = 0; i < read_columns.size(); ++i) + { + if (!read_columns[i]) + { + not_seen_columns.emplace_back(i); + } + } +} + +void JSONStringsEachRowRowInputFormat::addInputColumn(const String & column_name) +{ + names_of_columns.emplace_back(column_name); + + const auto column_it = column_indexes_by_names.find(column_name); + if (column_it == column_indexes_by_names.end()) + { + if (format_settings.skip_unknown_fields) + { + column_indexes_for_input_fields.push_back(std::nullopt); + return; + } + + throw Exception( + "Unknown field found in JSONStringsEachRow header: '" + column_name + "' " + + "at position " + std::to_string(column_indexes_for_input_fields.size()) + + "\nSet the 'input_format_skip_unknown_fields' parameter explicitly to ignore and proceed", + ErrorCodes::INCORRECT_DATA + ); + } + + const auto column_index = column_it->second; + + if (read_columns[column_index]) + throw Exception("Duplicate field found while parsing JSONStringsEachRow header: " + column_name, ErrorCodes::INCORRECT_DATA); + + read_columns[column_index] = true; + column_indexes_for_input_fields.emplace_back(column_index); +} + +bool JSONStringsEachRowRowInputFormat::readRow(DB::MutableColumns &columns, DB::RowReadExtension &ext) +{ + skipEndOfLine(); + + if (in.eof()) + return false; + + size_t num_columns = columns.size(); + + read_columns.assign(num_columns, false); + + assertChar('[', in); + for (size_t file_column = 0; file_column < column_indexes_for_input_fields.size(); ++file_column) + { + const auto & table_column = column_indexes_for_input_fields[file_column]; + if (table_column) + { + readField(*table_column, columns); + } + else + { + skipJSONField(in, StringRef(names_of_columns[file_column])); + } + + skipWhitespaceIfAny(in); + if (in.eof()) + throw Exception("Unexpected end of stream while parsing JSONStringsEachRow format", ErrorCodes::CANNOT_READ_ALL_DATA); + if (file_column + 1 != column_indexes_for_input_fields.size()) + { + assertChar(',', in); + skipWhitespaceIfAny(in); + } + } + assertChar(']', in); + + for (const auto & name : not_seen_columns) + columns[name]->insertDefault(); + + ext.read_columns = read_columns; + return 
true; +} + +void JSONStringsEachRowRowInputFormat::skipEndOfLine() +{ + skipWhitespaceIfAny(in); + if (!in.eof() && (*in.position() == ',' || *in.position() == ';')) + ++in.position(); + + skipWhitespaceIfAny(in); +} + +void JSONStringsEachRowRowInputFormat::readField(size_t index, MutableColumns & columns) +{ + try + { + read_columns[index] = true; + const auto & type = data_types[index]; + + String str; + readJSONString(str, in); + + ReadBufferFromString buf(str); + + type->deserializeAsWholeText(*columns[index], buf, format_settings); + } + catch (Exception & e) + { + e.addMessage("(while read the value of key " + getPort().getHeader().getByPosition(index).name + ")"); + throw; + } +} + +void JSONStringsEachRowRowInputFormat::syncAfterError() +{ + skipToUnescapedNextLineOrEOF(in); +} + +void registerInputFormatProcessorJSONStringsEachRow(FormatFactory & factory) +{ + factory.registerInputFormatProcessor("JSONStringsEachRow", []( + ReadBuffer & buf, + const Block & sample, + IRowInputFormat::Params params, + const FormatSettings & settings) + { + return std::make_shared(buf, sample, std::move(params), settings, false); + }); + + factory.registerInputFormatProcessor("JSONStringsEachRowWithNamesAndTypes", []( + ReadBuffer & buf, + const Block & sample, + IRowInputFormat::Params params, + const FormatSettings & settings) + { + return std::make_shared(buf, sample, std::move(params), settings, true); + }); +} + +} diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h b/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h new file mode 100644 index 00000000000..ec0a0f7bad9 --- /dev/null +++ b/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h @@ -0,0 +1,54 @@ +#pragma once + +#pragma once + +#include +#include +#include +#include + +namespace DB +{ + +class ReadBuffer; + +/** A stream for reading data in JSONStringsEachRow and JSONStringsEachRowWithNamesAndTypes formats +*/ +class JSONStringsEachRowRowInputFormat : public IRowInputFormat +{ +public: + JSONStringsEachRowRowInputFormat(ReadBuffer & in_, const Block & header_, Params params_, const FormatSettings & format_settings_, bool with_names_); + + String getName() const override { return "JSONStringsEachRowRowInputFormat"; } + + + void readPrefix() override; + bool readRow(MutableColumns & columns, RowReadExtension & ext) override; + bool allowSyncAfterError() const override { return true; } + void syncAfterError() override; + void resetParser() override; + +private: + void addInputColumn(const String & column_name); + void skipEndOfLine(); + void readField(size_t index, MutableColumns & columns); + + const FormatSettings format_settings; + + using IndexesMap = std::unordered_map; + IndexesMap column_indexes_by_names; + + using OptionalIndexes = std::vector>; + OptionalIndexes column_indexes_for_input_fields; + + DataTypes data_types; + std::vector read_columns; + std::vector not_seen_columns; + + /// This is for the correct exceptions in skipping unknown fields. 
+ std::vector names_of_columns; + + bool with_names; +}; + +} diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp new file mode 100644 index 00000000000..75007ea236e --- /dev/null +++ b/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp @@ -0,0 +1,117 @@ +#include +#include +#include +#include + + +namespace DB +{ + + +JSONStringsEachRowRowOutputFormat::JSONStringsEachRowRowOutputFormat(WriteBuffer & out_, + const Block & header_, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool with_names_) + : IRowOutputFormat(header_, out_, callback), settings(settings_), with_names(with_names_) +{ + const auto & sample = getPort(PortKind::Main).getHeader(); + NamesAndTypesList columns(sample.getNamesAndTypesList()); + fields.assign(columns.begin(), columns.end()); +} + + +void JSONStringsEachRowRowOutputFormat::writeField(const IColumn & column, const IDataType & type, size_t row_num) +{ + WriteBufferFromOwnString buf; + + type.serializeAsText(column, row_num, buf, settings); + writeJSONString(buf.str(), out, settings); +} + + +void JSONStringsEachRowRowOutputFormat::writeFieldDelimiter() +{ + writeCString(", ", out); +} + + +void JSONStringsEachRowRowOutputFormat::writeRowStartDelimiter() +{ + writeChar('[', out); +} + + +void JSONStringsEachRowRowOutputFormat::writeRowEndDelimiter() +{ + writeCString("]\n", out); +} + +void JSONStringsEachRowRowOutputFormat::writeTotals(const Columns & columns, size_t row_num) +{ + writeChar('\n', out); + size_t num_columns = columns.size(); + writeChar('[', out); + for (size_t i = 0; i < num_columns; ++i) + { + if (i != 0) + JSONStringsEachRowRowOutputFormat::writeFieldDelimiter(); + + JSONStringsEachRowRowOutputFormat::writeField(*columns[i], *types[i], row_num); + } + writeCString("]\n", out); +} + +void JSONStringsEachRowRowOutputFormat::writePrefix() +{ + if (with_names) + { + writeChar('[', out); + for (size_t i = 0; i < fields.size(); ++i) + { + writeChar('\"', out); + writeString(fields[i].name, out); + writeChar('\"', out); + if (i != fields.size() - 1) + writeCString(", ", out); + } + writeCString("]\n[", out); + for (size_t i = 0; i < fields.size(); ++i) + { + writeJSONString(fields[i].type->getName(), out, settings); + if (i != fields.size() - 1) + writeCString(", ", out); + } + writeCString("]\n", out); + } +} + +void JSONStringsEachRowRowOutputFormat::consumeTotals(DB::Chunk chunk) +{ + if (with_names) + IRowOutputFormat::consumeTotals(std::move(chunk)); +} + +void registerOutputFormatProcessorJSONStringsEachRow(FormatFactory & factory) +{ + factory.registerOutputFormatProcessor("JSONStringsEachRow", []( + WriteBuffer & buf, + const Block & sample, + FormatFactory::WriteCallback callback, + const FormatSettings & format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, false); + }); + + factory.registerOutputFormatProcessor("JSONStringsEachRowWithNamesAndTypes", []( + WriteBuffer &buf, + const Block &sample, + FormatFactory::WriteCallback callback, + const FormatSettings &format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, true); + }); +} + + +} diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h new file mode 100644 index 00000000000..1d43a333da1 --- /dev/null +++ b/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h @@ -0,0 +1,45 @@ +#pragma 
once + +#include +#include +#include +#include + + +namespace DB +{ + +/** The stream for outputting data in JSON format, by object per line. + * Does not validate UTF-8. + */ +class JSONStringsEachRowRowOutputFormat : public IRowOutputFormat +{ +public: + JSONStringsEachRowRowOutputFormat(WriteBuffer & out_, const Block & header_, FormatFactory::WriteCallback callback, const FormatSettings & settings_, bool with_names); + + String getName() const override { return "JSONStringsEachRowRowOutputFormat"; } + + void writePrefix() override; + + void writeBeforeTotals() override {} + void writeTotals(const Columns & columns, size_t row_num) override; + void writeAfterTotals() override {} + + void writeField(const IColumn & column, const IDataType & type, size_t row_num) override; + void writeFieldDelimiter() override; + void writeRowStartDelimiter() override; + void writeRowEndDelimiter() override; + +protected: + void consumeTotals(Chunk) override; + /// No extremes. + void consumeExtremes(Chunk) override {} + +private: + FormatSettings settings; + + NamesAndTypes fields; + + bool with_names; +}; +} diff --git a/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp new file mode 100644 index 00000000000..6ccb315f73f --- /dev/null +++ b/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp @@ -0,0 +1,93 @@ +#include +#include + +#include + + +namespace DB +{ + +JSONStringsRowOutputFormat::JSONStringsRowOutputFormat( + WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_) + : JSONRowOutputFormat(out_, header, callback, settings_) +{ +} + + +void JSONStringsRowOutputFormat::writeField(const IColumn & column, const IDataType & type, size_t row_num) +{ + WriteBufferFromOwnString buf; + + type.serializeAsText(column, row_num, buf, settings); + writeJSONString(buf.str(), *ostr, settings); + ++field_number; +} + + +void JSONStringsRowOutputFormat::writeFieldDelimiter() +{ + writeCString(", ", *ostr); +} + +void JSONStringsRowOutputFormat::writeTotalsFieldDelimiter() +{ + writeCString(",", *ostr); +} + + +void JSONStringsRowOutputFormat::writeRowStartDelimiter() +{ + writeCString("\t\t[", *ostr); +} + + +void JSONStringsRowOutputFormat::writeRowEndDelimiter() +{ + writeChar(']', *ostr); + field_number = 0; + ++row_count; +} + +void JSONStringsRowOutputFormat::writeBeforeTotals() +{ + writeCString(",\n", *ostr); + writeChar('\n', *ostr); + writeCString("\t\"totals\": [", *ostr); +} + +void JSONStringsRowOutputFormat::writeAfterTotals() +{ + writeChar(']', *ostr); +} + +void JSONStringsRowOutputFormat::writeExtremesElement(const char * title, const Columns & columns, size_t row_num) +{ + writeCString("\t\t\"", *ostr); + writeCString(title, *ostr); + writeCString("\": [", *ostr); + + size_t extremes_columns = columns.size(); + for (size_t i = 0; i < extremes_columns; ++i) + { + if (i != 0) + writeTotalsFieldDelimiter(); + + writeField(*columns[i], *types[i], row_num); + } + + writeChar(']', *ostr); +} + +void registerOutputFormatProcessorJSONStrings(FormatFactory & factory) +{ + factory.registerOutputFormatProcessor("JSONStrings", []( + WriteBuffer & buf, + const Block & sample, + FormatFactory::WriteCallback callback, + const FormatSettings & format_settings) + { + return std::make_shared(buf, sample, callback, format_settings); + }); +} + +} diff --git a/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h b/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h new 
file mode 100644 index 00000000000..b221bc9ee36 --- /dev/null +++ b/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h @@ -0,0 +1,43 @@ +#pragma once + +#include +#include +#include +#include + + +namespace DB +{ + +struct FormatSettings; + +/** The stream for outputting data in the JSONStrings format. + */ +class JSONStringsRowOutputFormat : public JSONRowOutputFormat +{ +public: + JSONStringsRowOutputFormat(WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_); + + String getName() const override { return "JSONStringsRowOutputFormat"; } + + void writeField(const IColumn & column, const IDataType & type, size_t row_num) override; + void writeFieldDelimiter() override; + void writeRowStartDelimiter() override; + void writeRowEndDelimiter() override; + + void writeBeforeTotals() override; + void writeAfterTotals() override; + +protected: + void writeExtremesElement(const char * title, const Columns & columns, size_t row_num) override; + + void writeTotalsField(const IColumn & column, const IDataType & type, size_t row_num) override + { + return writeField(column, type, row_num); + } + + void writeTotalsFieldDelimiter() override; + +}; + +} diff --git a/src/Processors/ya.make b/src/Processors/ya.make index 30de38fedbd..27893674859 100644 --- a/src/Processors/ya.make +++ b/src/Processors/ya.make @@ -31,6 +31,9 @@ SRCS( Formats/Impl/JSONEachRowRowOutputFormat.cpp Formats/Impl/JSONEachRowWithProgressRowOutputFormat.cpp Formats/Impl/JSONRowOutputFormat.cpp + Formats/Impl/JSONStringsEachRowRowInputFormat.cpp + Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp + Formats/Impl/JSONStringsRowOutputFormat.cpp Formats/Impl/MarkdownRowOutputFormat.cpp Formats/Impl/MsgPackRowInputFormat.cpp Formats/Impl/MsgPackRowOutputFormat.cpp From c25a99aaf58108651149930db5ef86e1313120c4 Mon Sep 17 00:00:00 2001 From: hcz Date: Tue, 1 Sep 2020 17:47:37 +0800 Subject: [PATCH 014/341] Add tests --- .../01446_JSONStringsEachRow.reference | 47 ++++++++++++++ .../0_stateless/01446_JSONStringsEachRow.sql | 63 +++++++++++++++++++ .../0_stateless/01447_JSONStrings.reference | 43 +++++++++++++ .../queries/0_stateless/01447_JSONStrings.sql | 8 +++ 4 files changed, 161 insertions(+) create mode 100644 tests/queries/0_stateless/01446_JSONStringsEachRow.reference create mode 100644 tests/queries/0_stateless/01446_JSONStringsEachRow.sql create mode 100644 tests/queries/0_stateless/01447_JSONStrings.reference create mode 100644 tests/queries/0_stateless/01447_JSONStrings.sql diff --git a/tests/queries/0_stateless/01446_JSONStringsEachRow.reference b/tests/queries/0_stateless/01446_JSONStringsEachRow.reference new file mode 100644 index 00000000000..0b05f050b29 --- /dev/null +++ b/tests/queries/0_stateless/01446_JSONStringsEachRow.reference @@ -0,0 +1,47 @@ +1 +["1", "a"] +["2", "b"] +["3", "c"] +2 +["a", "1"] +["b", "1"] +["c", "1"] +3 +["value", "name"] +["UInt8", "String"] +["1", "a"] +["2", "b"] +["3", "c"] +4 +["name", "c"] +["String", "UInt64"] +["a", "1"] +["b", "1"] +["c", "1"] + +["", "3"] +5 +["first", "1", "2", "0"] +["second", "2", "0", "6"] +6 +["first", "1", "2", "0"] +["second", "2", "0", "6"] +7 +["16", "[15,16,17]", "['first','second','third']"] +8 +["first", "1", "2", "0"] +["second", "2", "0", "6"] +9 +["first", "1", "2", "0"] +["second", "2", "0", "6"] +10 +["first", "1", "16", "8"] +["second", "2", "32", "8"] +11 +["v1", "v2", "v3", "v4"] +["String", "UInt8", "UInt16", "UInt8"] +["", "2", "3", "1"] +12 +["v1", "n.id", "n.name"] +["UInt8", 
"Array(UInt8)", "Array(String)"] +["16", "[15,16,17]", "['first','second','third']"] diff --git a/tests/queries/0_stateless/01446_JSONStringsEachRow.sql b/tests/queries/0_stateless/01446_JSONStringsEachRow.sql new file mode 100644 index 00000000000..f461b217fe4 --- /dev/null +++ b/tests/queries/0_stateless/01446_JSONStringsEachRow.sql @@ -0,0 +1,63 @@ +DROP TABLE IF EXISTS test_table; +DROP TABLE IF EXISTS test_table_2; +SELECT 1; +/* Check JSONStringsEachRow Output */ +CREATE TABLE test_table (value UInt8, name String) ENGINE = MergeTree() ORDER BY value; +INSERT INTO test_table VALUES (1, 'a'), (2, 'b'), (3, 'c'); +SELECT * FROM test_table FORMAT JSONStringsEachRow; +SELECT 2; +/* Check Totals */ +SELECT name, count() AS c FROM test_table GROUP BY name WITH TOTALS ORDER BY name FORMAT JSONStringsEachRow; +SELECT 3; +/* Check JSONStringsEachRowWithNamesAndTypes Output */ +SELECT * FROM test_table FORMAT JSONStringsEachRowWithNamesAndTypes; +SELECT 4; +/* Check Totals */ +SELECT name, count() AS c FROM test_table GROUP BY name WITH TOTALS ORDER BY name FORMAT JSONStringsEachRowWithNamesAndTypes; +DROP TABLE IF EXISTS test_table; +SELECT 5; +/* Check JSONStringsEachRow Input */ +CREATE TABLE test_table (v1 String, v2 UInt8, v3 DEFAULT v2 * 16, v4 UInt8 DEFAULT 8) ENGINE = MergeTree() ORDER BY v2; +INSERT INTO test_table FORMAT JSONStringsEachRow ["first", "1", "2", "NULL"] ["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 6; +/* Check input_format_null_as_default = 1 */ +SET input_format_null_as_default = 1; +INSERT INTO test_table FORMAT JSONStringsEachRow ["first", "1", "2", "ᴺᵁᴸᴸ"] ["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 7; +/* Check Nested */ +CREATE TABLE test_table_2 (v1 UInt8, n Nested(id UInt8, name String)) ENGINE = MergeTree() ORDER BY v1; +INSERT INTO test_table_2 FORMAT JSONStringsEachRow ["16", "[15, 16, 17]", "['first', 'second', 'third']"]; +SELECT * FROM test_table_2 FORMAT JSONStringsEachRow; +TRUNCATE TABLE test_table_2; +SELECT 8; +/* Check JSONStringsEachRowWithNamesAndTypes Output */ +SET input_format_null_as_default = 0; +INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "v2", "v3", "v4"]["String","UInt8","UInt16","UInt8"]["first", "1", "2", "null"]["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 9; +/* Check input_format_null_as_default = 1 */ +SET input_format_null_as_default = 1; +INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "v2", "v3", "v4"]["String","UInt8","UInt16","UInt8"]["first", "1", "2", "null"] ["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONStringsEachRow; +SELECT 10; +/* Check Header */ +TRUNCATE TABLE test_table; +SET input_format_skip_unknown_fields = 1; +INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "v2", "invalid_column"]["String", "UInt8", "UInt8"]["first", "1", "32"]["second", "2", "64"]; +SELECT * FROM test_table FORMAT JSONStringsEachRow; +SELECT 11; +TRUNCATE TABLE test_table; +INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v4", "v2", "v3"]["UInt8", "UInt8", "UInt16"]["1", "2", "3"] +SELECT * FROM test_table FORMAT JSONStringsEachRowWithNamesAndTypes; +SELECT 12; +/* Check Nested */ +INSERT INTO test_table_2 FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "n.id", "n.name"]["UInt8", "Array(UInt8)", 
"Array(String)"]["16", "[15, 16, 17]", "['first', 'second', 'third']"]; +SELECT * FROM test_table_2 FORMAT JSONStringsEachRowWithNamesAndTypes; + +DROP TABLE IF EXISTS test_table; +DROP TABLE IF EXISTS test_table_2; diff --git a/tests/queries/0_stateless/01447_JSONStrings.reference b/tests/queries/0_stateless/01447_JSONStrings.reference new file mode 100644 index 00000000000..58af593dc77 --- /dev/null +++ b/tests/queries/0_stateless/01447_JSONStrings.reference @@ -0,0 +1,43 @@ +{ + "meta": + [ + { + "name": "1", + "type": "UInt8" + }, + { + "name": "'a'", + "type": "String" + }, + { + "name": "[1, 2, 3]", + "type": "Array(UInt8)" + }, + { + "name": "tuple(1, 'a')", + "type": "Tuple(UInt8, String)" + }, + { + "name": "NULL", + "type": "Nullable(Nothing)" + }, + { + "name": "nan", + "type": "Float64" + } + ], + + "data": + [ + ["1", "a", "[1,2,3]", "(1,'a')", "ᴺᵁᴸᴸ", "nan"] + ], + + "rows": 1, + + "statistics": + { + "elapsed": 0.00068988, + "rows_read": 1, + "bytes_read": 1 + } +} diff --git a/tests/queries/0_stateless/01447_JSONStrings.sql b/tests/queries/0_stateless/01447_JSONStrings.sql new file mode 100644 index 00000000000..7d89f0f5087 --- /dev/null +++ b/tests/queries/0_stateless/01447_JSONStrings.sql @@ -0,0 +1,8 @@ +SELECT + 1, + 'a', + [1, 2, 3], + (1, 'a'), + null, + nan +FORMAT JSONStrings; From 6d37c9d2a68ca3f6ae39c9bc0bb99424d7fc236e Mon Sep 17 00:00:00 2001 From: hcz Date: Tue, 1 Sep 2020 17:48:03 +0800 Subject: [PATCH 015/341] Update docs about formats --- docs/en/interfaces/formats.md | 26 +++++++++++++++++++------- 1 file changed, 19 insertions(+), 7 deletions(-) diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index 9d3965b4a9c..9c7c2dda8dc 100644 --- a/docs/en/interfaces/formats.md +++ b/docs/en/interfaces/formats.md @@ -26,7 +26,10 @@ The supported formats are: | [VerticalRaw](#verticalraw) | ✗ | ✔ | | [JSON](#json) | ✗ | ✔ | | [JSONCompact](#jsoncompact) | ✗ | ✔ | +| [JSONStrings](#jsonstrings) | ✗ | ✔ | | [JSONEachRow](#jsoneachrow) | ✔ | ✔ | +| [JSONCompactEachRow](#jsoncompacteachrow) | ✔ | ✔ | +| [JSONStringsEachRow](#jsonstringseachrow) | ✔ | ✔ | | [TSKV](#tskv) | ✔ | ✔ | | [Pretty](#pretty) | ✗ | ✔ | | [PrettyCompact](#prettycompact) | ✗ | ✔ | @@ -470,7 +473,7 @@ See also the [JSONEachRow](#jsoneachrow) format. ## JSONCompact {#jsoncompact} -Differs from JSON only in that data rows are output in arrays, not in objects. +Differs from JSON only in that data rows are output in arrays of any element type, not in objects. Example: @@ -514,17 +517,26 @@ Example: This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table). See also the `JSONEachRow` format. -## JSONEachRow {#jsoneachrow} +## JSONStrings {#jsonstrings} -When using this format, ClickHouse outputs rows as separated, newline-delimited JSON objects, but the data as a whole is not valid JSON. +Differs from JSON and JSONCompact only in that data rows are output in arrays of strings. + +This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table). +See also the `JSONEachRow` format. + +## JSONEachRow {#jsoneachrow} +## JSONCompactEachRow {#jsoncompacteachrow} +## JSONStringsEachRow {#jsonstringseachrow} + +When using these formats, ClickHouse outputs rows as separated, newline-delimited JSON values, but the data as a whole is not valid JSON. 
``` json -{"SearchPhrase":"curtain designs","count()":"1064"} -{"SearchPhrase":"baku","count()":"1000"} -{"SearchPhrase":"","count()":"8267016"} +{"some_int":42,"some_str":"hello","some_tuple":[1,"a"]} // JSONEachRow +[42,"hello",[1,"a"]] // JSONCompactEachRow +["42","hello","(2,'a')"] // JSONStringsEachRow ``` -When inserting the data, you should provide a separate JSON object for each row. +When inserting the data, you should provide a separate JSON value for each row. ### Inserting Data {#inserting-data} From babd3beec09054d1dc4b1b8a35cf30da013f05af Mon Sep 17 00:00:00 2001 From: hcz Date: Tue, 1 Sep 2020 17:48:19 +0800 Subject: [PATCH 016/341] Fix nullable data parsing --- src/DataTypes/DataTypeNullable.cpp | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/src/DataTypes/DataTypeNullable.cpp b/src/DataTypes/DataTypeNullable.cpp index 847047850fd..3318196b951 100644 --- a/src/DataTypes/DataTypeNullable.cpp +++ b/src/DataTypes/DataTypeNullable.cpp @@ -308,7 +308,10 @@ ReturnType DataTypeNullable::deserializeTextQuoted(IColumn & column, ReadBuffer const DataTypePtr & nested_data_type) { return safeDeserialize(column, *nested_data_type, - [&istr] { return checkStringByFirstCharacterAndAssertTheRestCaseInsensitive("NULL", istr); }, + [&istr] + { + return checkStringByFirstCharacterAndAssertTheRestCaseInsensitive("NULL", istr); + }, [&nested_data_type, &istr, &settings] (IColumn & nested) { nested_data_type->deserializeAsTextQuoted(nested, istr, settings); }); } @@ -316,7 +319,11 @@ ReturnType DataTypeNullable::deserializeTextQuoted(IColumn & column, ReadBuffer void DataTypeNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { safeDeserialize(column, *nested_data_type, - [&istr] { return checkStringByFirstCharacterAndAssertTheRestCaseInsensitive("NULL", istr); }, + [&istr] + { + return checkStringByFirstCharacterAndAssertTheRestCaseInsensitive("NULL", istr) + || checkStringByFirstCharacterAndAssertTheRest("ᴺᵁᴸᴸ", istr); + }, [this, &istr, &settings] (IColumn & nested) { nested_data_type->deserializeAsWholeText(nested, istr, settings); }); } From 3cadc9033ae63d7faa851b1707b3c6f9ce1a36aa Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 1 Sep 2020 18:26:49 +0300 Subject: [PATCH 017/341] fsyncs for metadata files of part --- .../MergeTree/IMergeTreeDataPartWriter.h | 2 +- .../MergeTreeDataPartWriterOnDisk.cpp | 2 +- .../MergeTree/MergedBlockOutputStream.cpp | 13 +++++++-- .../MergeTree/MergedBlockOutputStream.h | 3 +- utils/durability-test/create_sync.sql | 1 + utils/durability-test/durability-test.sh | 28 ++++++++++--------- utils/durability-test/insert_sync.sql | 1 + 7 files changed, 32 insertions(+), 18 deletions(-) create mode 100644 utils/durability-test/create_sync.sql mode change 100644 => 100755 utils/durability-test/durability-test.sh create mode 100644 utils/durability-test/insert_sync.sql diff --git a/src/Storages/MergeTree/IMergeTreeDataPartWriter.h b/src/Storages/MergeTree/IMergeTreeDataPartWriter.h index 4d3602e732e..4a42a58a65b 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPartWriter.h +++ b/src/Storages/MergeTree/IMergeTreeDataPartWriter.h @@ -52,7 +52,7 @@ public: virtual void initPrimaryIndex() {} virtual void finishDataSerialization(IMergeTreeDataPart::Checksums & checksums, bool sync) = 0; - virtual void finishPrimaryIndexSerialization(MergeTreeData::DataPart::Checksums & /* checksums */, bool /* sync */) {} + virtual void 
finishPrimaryIndexSerialization(MergeTreeData::DataPart::Checksums & /* checksums */, bool /* sync */) {} virtual void finishSkipIndicesSerialization(MergeTreeData::DataPart::Checksums & /* checksums */, bool /* sync */) {} Columns releaseIndexColumns(); diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterOnDisk.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterOnDisk.cpp index dbe41144573..8295b881d87 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterOnDisk.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterOnDisk.cpp @@ -332,7 +332,7 @@ void MergeTreeDataPartWriterOnDisk::finishPrimaryIndexSerialization( checksums.files["primary.idx"].file_size = index_stream->count(); checksums.files["primary.idx"].file_hash = index_stream->getHash(); if (sync) - index_stream->sync(); + index_file_stream->sync(); index_stream = nullptr; } } diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.cpp b/src/Storages/MergeTree/MergedBlockOutputStream.cpp index fdef5d69688..bdc6bade259 100644 --- a/src/Storages/MergeTree/MergedBlockOutputStream.cpp +++ b/src/Storages/MergeTree/MergedBlockOutputStream.cpp @@ -111,7 +111,7 @@ void MergedBlockOutputStream::writeSuffixAndFinalizePart( part_columns = *total_columns_list; if (new_part->isStoredOnDisk()) - finalizePartOnDisk(new_part, part_columns, checksums); + finalizePartOnDisk(new_part, part_columns, checksums, sync); new_part->setColumns(part_columns); new_part->rows_count = rows_count; @@ -126,7 +126,8 @@ void MergedBlockOutputStream::writeSuffixAndFinalizePart( void MergedBlockOutputStream::finalizePartOnDisk( const MergeTreeData::MutableDataPartPtr & new_part, NamesAndTypesList & part_columns, - MergeTreeData::DataPart::Checksums & checksums) + MergeTreeData::DataPart::Checksums & checksums, + bool sync) { if (storage.format_version >= MERGE_TREE_DATA_MIN_FORMAT_VERSION_WITH_CUSTOM_PARTITIONING || isCompactPart(new_part)) { @@ -143,6 +144,8 @@ void MergedBlockOutputStream::finalizePartOnDisk( count_out_hashing.next(); checksums.files["count.txt"].file_size = count_out_hashing.count(); checksums.files["count.txt"].file_hash = count_out_hashing.getHash(); + if (sync) + count_out->sync(); } if (!new_part->ttl_infos.empty()) @@ -153,6 +156,8 @@ void MergedBlockOutputStream::finalizePartOnDisk( new_part->ttl_infos.write(out_hashing); checksums.files["ttl.txt"].file_size = out_hashing.count(); checksums.files["ttl.txt"].file_hash = out_hashing.getHash(); + if (sync) + out->sync(); } removeEmptyColumnsFromPart(new_part, part_columns, checksums); @@ -161,12 +166,16 @@ void MergedBlockOutputStream::finalizePartOnDisk( /// Write a file with a description of columns. auto out = volume->getDisk()->writeFile(part_path + "columns.txt", 4096); part_columns.writeText(*out); + if (sync) + out->sync(); } { /// Write file with checksums. 
auto out = volume->getDisk()->writeFile(part_path + "checksums.txt", 4096); checksums.write(*out); + if (sync) + out->sync(); } } diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.h b/src/Storages/MergeTree/MergedBlockOutputStream.h index 0b500b93f01..87ff9dd1ded 100644 --- a/src/Storages/MergeTree/MergedBlockOutputStream.h +++ b/src/Storages/MergeTree/MergedBlockOutputStream.h @@ -59,7 +59,8 @@ private: void finalizePartOnDisk( const MergeTreeData::MutableDataPartPtr & new_part, NamesAndTypesList & part_columns, - MergeTreeData::DataPart::Checksums & checksums); + MergeTreeData::DataPart::Checksums & checksums, + bool sync); private: NamesAndTypesList columns_list; diff --git a/utils/durability-test/create_sync.sql b/utils/durability-test/create_sync.sql new file mode 100644 index 00000000000..2cc88d2c943 --- /dev/null +++ b/utils/durability-test/create_sync.sql @@ -0,0 +1 @@ +CREATE TABLE test_sync (a Int, s String) ENGINE = MergeTree ORDER BY a SETTINGS fsync_after_insert = 1, min_compressed_bytes_to_fsync_after_merge = 1; diff --git a/utils/durability-test/durability-test.sh b/utils/durability-test/durability-test.sh old mode 100644 new mode 100755 index 1f47c900f49..c7f8936ec95 --- a/utils/durability-test/durability-test.sh +++ b/utils/durability-test/durability-test.sh @@ -17,12 +17,12 @@ fi function run() { - sshpass -p $PASSWORD ssh -p $SSH_PORT root@localhost "$1" + sshpass -p $PASSWORD ssh -p $SSH_PORT root@localhost "$1" 2>/dev/null } function copy() { - sshpass -p $PASSWORD scp -r -P $SSH_PORT $1 root@localhost:$2 + sshpass -p $PASSWORD scp -r -P $SSH_PORT $1 root@localhost:$2 2>/dev/null } function wait_vm_for_start() @@ -50,8 +50,8 @@ function wait_clickhouse_for_start() { echo "Waiting until ClickHouse started..." started=0 - for i in {0..15}; do - run "clickhouse client --query 'select 1'" + for i in {0..30}; do + run "clickhouse client --query 'select 1'" > /dev/null if [ $? 
-eq 0 ]; then started=1 break @@ -70,7 +70,7 @@ echo "Downloading image" curl -O $URL/$IMAGE qemu-img resize $IMAGE +10G -virt-customize -a $IMAGE --root-password password:$PASSWORD +virt-customize -a $IMAGE --root-password password:$PASSWORD > /dev/null 2>&1 virt-copy-in -a $IMAGE sshd_config /etc/ssh echo "Starting VM" @@ -93,8 +93,8 @@ if [[ -z $CLICKHOUSE_CONFIG_DIR ]]; then CLICKHOUSE_CONFIG_DIR=/etc/clickhouse-server fi -echo "Using ClickHouse binary: " $CLICKHOUSE_BINARY -echo "Using ClickHouse config from: " $CLICKHOUSE_CONFIG_DIR +echo "Using ClickHouse binary:" $CLICKHOUSE_BINARY +echo "Using ClickHouse config from:" $CLICKHOUSE_CONFIG_DIR copy $CLICKHOUSE_BINARY /usr/bin copy $CLICKHOUSE_CONFIG_DIR /etc @@ -104,23 +104,19 @@ echo "Prepared VM" echo "Starting ClickHouse" run "clickhouse server --config-file=/etc/clickhouse-server/config.xml > clickhouse-server.log 2>&1" & - wait_clickhouse_for_start -echo "Started ClickHouse" - query=`cat $CREATE_QUERY` echo "Executing query:" $query run "clickhouse client --query '$query'" query=`cat $INSERT_QUERY` echo "Will run in a loop query: " $query -run "clickhouse benchmark <<< '$query'" & +run "clickhouse benchmark <<< '$query' -c 8" & echo "Running queries" pid=`pidof qemu-system-x86_64` -sec=$(( (RANDOM % 3) + 25 )) - +sec=$(( (RANDOM % 5) + 25 )) ms=$(( RANDOM % 1000 )) echo "Will kill VM in $sec.$ms sec" @@ -130,6 +126,8 @@ kill -9 $pid echo "Restarting" +sleep 5s + ./startup.exp > qemu.log 2>&1 & wait_vm_for_start @@ -137,10 +135,12 @@ run "rm -r *data/system" run "clickhouse server --config-file=/etc/clickhouse-server/config.xml > clickhouse-server.log 2>&1" & wait_clickhouse_for_start +pid=`pidof qemu-system-x86_64` result=`run "grep $TABLE_NAME clickhouse-server.log | grep 'Caught exception while loading metadata'"` if [[ -n $result ]]; then echo "FAIL. Can't attach table:" echo $result + kill -9 $pid exit 1 fi @@ -148,7 +148,9 @@ result=`run "grep $TABLE_NAME clickhouse-server.log | grep 'Considering to remov if [[ -n $result ]]; then echo "FAIL. 
Have broken parts:" echo $result + kill -9 $pid exit 1 fi +kill -9 $pid echo OK diff --git a/utils/durability-test/insert_sync.sql b/utils/durability-test/insert_sync.sql new file mode 100644 index 00000000000..a1ad2ff4ea5 --- /dev/null +++ b/utils/durability-test/insert_sync.sql @@ -0,0 +1 @@ +INSERT INTO test_sync SELECT number, toString(number) FROM numbers(10) From ac5877e601714450a369062abbf80f84485bc6f5 Mon Sep 17 00:00:00 2001 From: hcz Date: Wed, 2 Sep 2020 00:58:39 +0800 Subject: [PATCH 018/341] Fix tests --- tests/queries/0_stateless/01447_JSONStrings.reference | 9 +-------- tests/queries/0_stateless/01447_JSONStrings.sql | 2 ++ 2 files changed, 3 insertions(+), 8 deletions(-) diff --git a/tests/queries/0_stateless/01447_JSONStrings.reference b/tests/queries/0_stateless/01447_JSONStrings.reference index 58af593dc77..1c6f073c0d0 100644 --- a/tests/queries/0_stateless/01447_JSONStrings.reference +++ b/tests/queries/0_stateless/01447_JSONStrings.reference @@ -32,12 +32,5 @@ ["1", "a", "[1,2,3]", "(1,'a')", "ᴺᵁᴸᴸ", "nan"] ], - "rows": 1, - - "statistics": - { - "elapsed": 0.00068988, - "rows_read": 1, - "bytes_read": 1 - } + "rows": 1 } diff --git a/tests/queries/0_stateless/01447_JSONStrings.sql b/tests/queries/0_stateless/01447_JSONStrings.sql index 7d89f0f5087..45fc4a56d7a 100644 --- a/tests/queries/0_stateless/01447_JSONStrings.sql +++ b/tests/queries/0_stateless/01447_JSONStrings.sql @@ -1,3 +1,5 @@ +SET output_format_write_statistics = 0; + SELECT 1, 'a', From 26d75f76026303b6f3769ab4ea39ff639ebe836a Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Wed, 2 Sep 2020 01:25:10 +0300 Subject: [PATCH 019/341] do fsync for WAL --- src/Storages/MergeTree/MergeTreeSettings.h | 2 ++ .../MergeTree/MergeTreeWriteAheadLog.cpp | 32 +++++++++++++++++-- .../MergeTree/MergeTreeWriteAheadLog.h | 10 +++++- 3 files changed, 41 insertions(+), 3 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index 1341526c38b..edf03710974 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -43,6 +43,8 @@ struct Settings; M(UInt64, min_compressed_bytes_to_fsync_after_fetch, 0, "Minimal number of compressed bytes to do fsync for part after fetch (0 - disabled)", 0) \ M(Bool, fsync_after_insert, false, "Do fsync for every inserted part. Significantly decreases performance of inserts, not recommended to use with wide parts.", 0) \ M(Bool, fsync_part_directory, false, "Do fsync for part directory after all part operations (writes, renames, etc.).", 0) \ + M(UInt64, write_ahead_log_bytes_to_fsync, 100ULL * 1024 * 1024, "Amount of bytes, accumulated in WAL to do fsync.", 0) \ + M(UInt64, write_ahead_log_interval_ms_to_fsync, 100, "Interval in milliseconds after which fsync for WAL is being done.", 0) \ \ /** Inserts settings. 
*/ \ M(UInt64, parts_to_delay_insert, 150, "If table contains at least that many active parts in single partition, artificially slow down insert into table.", 0) \ diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp index eda8579c76a..6f220fc7d5d 100644 --- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp +++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp @@ -4,6 +4,7 @@ #include #include #include +#include namespace DB { @@ -16,17 +17,23 @@ namespace ErrorCodes extern const int CORRUPTED_DATA; } - MergeTreeWriteAheadLog::MergeTreeWriteAheadLog( - const MergeTreeData & storage_, + MergeTreeData & storage_, const DiskPtr & disk_, const String & name_) : storage(storage_) , disk(disk_) , name(name_) , path(storage.getRelativeDataPath() + name_) + , pool(storage.global_context.getSchedulePool()) { init(); + sync_task = pool.createTask("MergeTreeWriteAheadLog::sync", [this] + { + std::lock_guard lock(write_mutex); + out->sync(); + sync_scheduled = false; + }); } void MergeTreeWriteAheadLog::init() @@ -38,6 +45,7 @@ void MergeTreeWriteAheadLog::init() block_out = std::make_unique(*out, 0, Block{}); min_block_number = std::numeric_limits::max(); max_block_number = -1; + bytes_at_last_sync = 0; } void MergeTreeWriteAheadLog::addPart(const Block & block, const String & part_name) @@ -53,6 +61,7 @@ void MergeTreeWriteAheadLog::addPart(const Block & block, const String & part_na writeStringBinary(part_name, *out); block_out->write(block); block_out->flush(); + sync(lock); auto max_wal_bytes = storage.getSettings()->write_ahead_log_max_bytes; if (out->count() > max_wal_bytes) @@ -66,6 +75,7 @@ void MergeTreeWriteAheadLog::dropPart(const String & part_name) writeIntBinary(static_cast(0), *out); writeIntBinary(static_cast(ActionType::DROP_PART), *out); writeStringBinary(part_name, *out); + sync(lock); } void MergeTreeWriteAheadLog::rotate(const std::lock_guard &) @@ -175,6 +185,24 @@ MergeTreeData::MutableDataPartsVector MergeTreeWriteAheadLog::restore(const Stor return result; } +void MergeTreeWriteAheadLog::sync(const std::lock_guard &) +{ + size_t bytes_to_sync = storage.getSettings()->write_ahead_log_bytes_to_fsync; + time_t time_to_sync = storage.getSettings()->write_ahead_log_interval_ms_to_fsync; + size_t current_bytes = out->count(); + + if (bytes_to_sync && current_bytes - bytes_at_last_sync > bytes_to_sync) + { + sync_task->schedule(); + bytes_at_last_sync = current_bytes; + } + else if (time_to_sync && !sync_scheduled) + { + sync_task->scheduleAfter(time_to_sync); + sync_scheduled = true; + } +} + std::optional MergeTreeWriteAheadLog::tryParseMinMaxBlockNumber(const String & filename) { diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.h b/src/Storages/MergeTree/MergeTreeWriteAheadLog.h index 2cc3c2b4181..43abf3c04be 100644 --- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.h +++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.h @@ -3,6 +3,7 @@ #include #include #include +#include #include namespace DB @@ -31,7 +32,7 @@ public: constexpr static auto WAL_FILE_EXTENSION = ".bin"; constexpr static auto DEFAULT_WAL_FILE_NAME = "wal.bin"; - MergeTreeWriteAheadLog(const MergeTreeData & storage_, const DiskPtr & disk_, + MergeTreeWriteAheadLog(MergeTreeData & storage_, const DiskPtr & disk_, const String & name = DEFAULT_WAL_FILE_NAME); void addPart(const Block & block, const String & part_name); @@ -44,6 +45,7 @@ public: private: void init(); void rotate(const std::lock_guard & lock); + void sync(const std::lock_guard 
& lock); const MergeTreeData & storage; DiskPtr disk; @@ -56,6 +58,12 @@ private: Int64 min_block_number = std::numeric_limits::max(); Int64 max_block_number = -1; + BackgroundSchedulePool & pool; + BackgroundSchedulePoolTaskHolder sync_task; + + size_t bytes_at_last_sync = 0; + bool sync_scheduled = false; + mutable std::mutex write_mutex; }; From a80c1adee81631f770f642ad4430a8ff44ff46af Mon Sep 17 00:00:00 2001 From: hcz Date: Wed, 2 Sep 2020 12:05:02 +0800 Subject: [PATCH 020/341] Add JSONCompactStrings formats --- docs/en/interfaces/formats.md | 288 +++++++++++------- src/Formats/FormatFactory.cpp | 6 - .../Impl/JSONCompactEachRowRowInputFormat.cpp | 49 ++- .../Impl/JSONCompactEachRowRowInputFormat.h | 11 +- .../JSONCompactEachRowRowOutputFormat.cpp | 37 ++- .../Impl/JSONCompactEachRowRowOutputFormat.h | 9 +- .../Impl/JSONCompactRowOutputFormat.cpp | 30 +- .../Formats/Impl/JSONCompactRowOutputFormat.h | 10 +- .../Impl/JSONEachRowRowInputFormat.cpp | 42 ++- .../Formats/Impl/JSONEachRowRowInputFormat.h | 9 +- .../Impl/JSONEachRowRowOutputFormat.cpp | 32 +- .../Formats/Impl/JSONEachRowRowOutputFormat.h | 10 +- ...JSONEachRowWithProgressRowOutputFormat.cpp | 11 +- .../Formats/Impl/JSONRowOutputFormat.cpp | 44 ++- .../Formats/Impl/JSONRowOutputFormat.h | 9 +- .../Impl/JSONStringsEachRowRowInputFormat.cpp | 245 --------------- .../Impl/JSONStringsEachRowRowInputFormat.h | 54 ---- .../JSONStringsEachRowRowOutputFormat.cpp | 117 ------- .../Impl/JSONStringsEachRowRowOutputFormat.h | 45 --- .../Impl/JSONStringsRowOutputFormat.cpp | 93 ------ .../Formats/Impl/JSONStringsRowOutputFormat.h | 43 --- .../0_stateless/01446_JSONStringsEachRow.sql | 63 ---- .../01446_json_strings_each_row.reference | 22 ++ .../01446_json_strings_each_row.sql | 38 +++ .../0_stateless/01447_json_strings.reference | 43 +++ ...JSONStrings.sql => 01447_json_strings.sql} | 0 ...8_json_compact_strings_each_row.reference} | 0 .../01448_json_compact_strings_each_row.sql | 63 ++++ ...e => 01449_json_compact_strings.reference} | 0 .../01449_json_compact_strings.sql | 10 + 30 files changed, 621 insertions(+), 812 deletions(-) delete mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp delete mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h delete mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp delete mode 100644 src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h delete mode 100644 src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp delete mode 100644 src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h delete mode 100644 tests/queries/0_stateless/01446_JSONStringsEachRow.sql create mode 100644 tests/queries/0_stateless/01446_json_strings_each_row.reference create mode 100644 tests/queries/0_stateless/01446_json_strings_each_row.sql create mode 100644 tests/queries/0_stateless/01447_json_strings.reference rename tests/queries/0_stateless/{01447_JSONStrings.sql => 01447_json_strings.sql} (100%) rename tests/queries/0_stateless/{01446_JSONStringsEachRow.reference => 01448_json_compact_strings_each_row.reference} (100%) create mode 100644 tests/queries/0_stateless/01448_json_compact_strings_each_row.sql rename tests/queries/0_stateless/{01447_JSONStrings.reference => 01449_json_compact_strings.reference} (100%) create mode 100644 tests/queries/0_stateless/01449_json_compact_strings.sql diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index 9c7c2dda8dc..bfe5b6218e4 100644 --- a/docs/en/interfaces/formats.md 
+++ b/docs/en/interfaces/formats.md @@ -10,45 +10,51 @@ results of a `SELECT`, and to perform `INSERT`s into a file-backed table. The supported formats are: -| Format | Input | Output | -|-----------------------------------------------------------------|-------|--------| -| [TabSeparated](#tabseparated) | ✔ | ✔ | -| [TabSeparatedRaw](#tabseparatedraw) | ✔ | ✔ | -| [TabSeparatedWithNames](#tabseparatedwithnames) | ✔ | ✔ | -| [TabSeparatedWithNamesAndTypes](#tabseparatedwithnamesandtypes) | ✔ | ✔ | -| [Template](#format-template) | ✔ | ✔ | -| [TemplateIgnoreSpaces](#templateignorespaces) | ✔ | ✗ | -| [CSV](#csv) | ✔ | ✔ | -| [CSVWithNames](#csvwithnames) | ✔ | ✔ | -| [CustomSeparated](#format-customseparated) | ✔ | ✔ | -| [Values](#data-format-values) | ✔ | ✔ | -| [Vertical](#vertical) | ✗ | ✔ | -| [VerticalRaw](#verticalraw) | ✗ | ✔ | -| [JSON](#json) | ✗ | ✔ | -| [JSONCompact](#jsoncompact) | ✗ | ✔ | -| [JSONStrings](#jsonstrings) | ✗ | ✔ | -| [JSONEachRow](#jsoneachrow) | ✔ | ✔ | -| [JSONCompactEachRow](#jsoncompacteachrow) | ✔ | ✔ | -| [JSONStringsEachRow](#jsonstringseachrow) | ✔ | ✔ | -| [TSKV](#tskv) | ✔ | ✔ | -| [Pretty](#pretty) | ✗ | ✔ | -| [PrettyCompact](#prettycompact) | ✗ | ✔ | -| [PrettyCompactMonoBlock](#prettycompactmonoblock) | ✗ | ✔ | -| [PrettyNoEscapes](#prettynoescapes) | ✗ | ✔ | -| [PrettySpace](#prettyspace) | ✗ | ✔ | -| [Protobuf](#protobuf) | ✔ | ✔ | -| [Avro](#data-format-avro) | ✔ | ✔ | -| [AvroConfluent](#data-format-avro-confluent) | ✔ | ✗ | -| [Parquet](#data-format-parquet) | ✔ | ✔ | -| [Arrow](#data-format-arrow) | ✔ | ✔ | -| [ArrowStream](#data-format-arrow-stream) | ✔ | ✔ | -| [ORC](#data-format-orc) | ✔ | ✗ | -| [RowBinary](#rowbinary) | ✔ | ✔ | -| [RowBinaryWithNamesAndTypes](#rowbinarywithnamesandtypes) | ✔ | ✔ | -| [Native](#native) | ✔ | ✔ | -| [Null](#null) | ✗ | ✔ | -| [XML](#xml) | ✗ | ✔ | -| [CapnProto](#capnproto) | ✔ | ✗ | +| Format | Input | Output | +|-----------------------------------------------------------------------------------------|-------|--------| +| [TabSeparated](#tabseparated) | ✔ | ✔ | +| [TabSeparatedRaw](#tabseparatedraw) | ✔ | ✔ | +| [TabSeparatedWithNames](#tabseparatedwithnames) | ✔ | ✔ | +| [TabSeparatedWithNamesAndTypes](#tabseparatedwithnamesandtypes) | ✔ | ✔ | +| [Template](#format-template) | ✔ | ✔ | +| [TemplateIgnoreSpaces](#templateignorespaces) | ✔ | ✗ | +| [CSV](#csv) | ✔ | ✔ | +| [CSVWithNames](#csvwithnames) | ✔ | ✔ | +| [CustomSeparated](#format-customseparated) | ✔ | ✔ | +| [Values](#data-format-values) | ✔ | ✔ | +| [Vertical](#vertical) | ✗ | ✔ | +| [VerticalRaw](#verticalraw) | ✗ | ✔ | +| [JSON](#json) | ✗ | ✔ | +| [JSONString](#jsonstring) | ✗ | ✔ | +| [JSONCompact](#jsoncompact) | ✗ | ✔ | +| [JSONCompactString](#jsoncompactstring) | ✗ | ✔ | +| [JSONEachRow](#jsoneachrow) | ✔ | ✔ | +| [JSONEachRowWithProgress](#jsoneachrowwithprogress) | ✗ | ✔ | +| [JSONStringEachRow](#jsonstringeachrow) | ✔ | ✔ | +| [JSONStringEachRowWithProgress](#jsonstringeachrowwithprogress) | ✗ | ✔ | +| [JSONCompactEachRow](#jsoncompacteachrow) | ✔ | ✔ | +| [JSONCompactEachRowWithNamesAndTypes](#jsoncompacteachrowwithnamesandtypes) | ✔ | ✔ | +| [JSONCompactStringEachRow](#jsoncompactstringeachrow) | ✔ | ✔ | +| [JSONCompactStringEachRowWithNamesAndTypes](#jsoncompactstringeachrowwithnamesandtypes) | ✔ | ✔ | +| [TSKV](#tskv) | ✔ | ✔ | +| [Pretty](#pretty) | ✗ | ✔ | +| [PrettyCompact](#prettycompact) | ✗ | ✔ | +| [PrettyCompactMonoBlock](#prettycompactmonoblock) | ✗ | ✔ | +| [PrettyNoEscapes](#prettynoescapes) | ✗ | ✔ | +| 
[PrettySpace](#prettyspace) | ✗ | ✔ | +| [Protobuf](#protobuf) | ✔ | ✔ | +| [Avro](#data-format-avro) | ✔ | ✔ | +| [AvroConfluent](#data-format-avro-confluent) | ✔ | ✗ | +| [Parquet](#data-format-parquet) | ✔ | ✔ | +| [Arrow](#data-format-arrow) | ✔ | ✔ | +| [ArrowStream](#data-format-arrow-stream) | ✔ | ✔ | +| [ORC](#data-format-orc) | ✔ | ✗ | +| [RowBinary](#rowbinary) | ✔ | ✔ | +| [RowBinaryWithNamesAndTypes](#rowbinarywithnamesandtypes) | ✔ | ✔ | +| [Native](#native) | ✔ | ✔ | +| [Null](#null) | ✗ | ✔ | +| [XML](#xml) | ✗ | ✔ | +| [CapnProto](#capnproto) | ✔ | ✗ | You can control some format processing parameters with the ClickHouse settings. For more information read the [Settings](../operations/settings/settings.md) section. @@ -395,62 +401,41 @@ SELECT SearchPhrase, count() AS c FROM test.hits GROUP BY SearchPhrase WITH TOTA "meta": [ { - "name": "SearchPhrase", + "name": "'hello'", "type": "String" }, { - "name": "c", + "name": "multiply(42, number)", "type": "UInt64" + }, + { + "name": "range(5)", + "type": "Array(UInt8)" } ], "data": [ { - "SearchPhrase": "", - "c": "8267016" + "'hello'": "hello", + "multiply(42, number)": "0", + "range(5)": [0,1,2,3,4] }, { - "SearchPhrase": "bathroom interior design", - "c": "2166" + "'hello'": "hello", + "multiply(42, number)": "42", + "range(5)": [0,1,2,3,4] }, { - "SearchPhrase": "yandex", - "c": "1655" - }, - { - "SearchPhrase": "spring 2014 fashion", - "c": "1549" - }, - { - "SearchPhrase": "freeform photos", - "c": "1480" + "'hello'": "hello", + "multiply(42, number)": "84", + "range(5)": [0,1,2,3,4] } ], - "totals": - { - "SearchPhrase": "", - "c": "8873898" - }, + "rows": 3, - "extremes": - { - "min": - { - "SearchPhrase": "", - "c": "1480" - }, - "max": - { - "SearchPhrase": "", - "c": "8267016" - } - }, - - "rows": 5, - - "rows_before_limit_at_least": 141137 + "rows_before_limit_at_least": 3 } ``` @@ -471,73 +456,166 @@ ClickHouse supports [NULL](../sql-reference/syntax.md), which is displayed as `n See also the [JSONEachRow](#jsoneachrow) format. -## JSONCompact {#jsoncompact} +## JSONString {#jsonstring} -Differs from JSON only in that data rows are output in arrays of any element type, not in objects. +Differs from JSON only in that data fields are output in strings, not in typed json values. Example: -``` json +```json { "meta": [ { - "name": "SearchPhrase", + "name": "'hello'", "type": "String" }, { - "name": "c", + "name": "multiply(42, number)", "type": "UInt64" + }, + { + "name": "range(5)", + "type": "Array(UInt8)" } ], "data": [ - ["", "8267016"], - ["bathroom interior design", "2166"], - ["yandex", "1655"], - ["fashion trends spring 2014", "1549"], - ["freeform photo", "1480"] + { + "'hello'": "hello", + "multiply(42, number)": "0", + "range(5)": "[0,1,2,3,4]" + }, + { + "'hello'": "hello", + "multiply(42, number)": "42", + "range(5)": "[0,1,2,3,4]" + }, + { + "'hello'": "hello", + "multiply(42, number)": "84", + "range(5)": "[0,1,2,3,4]" + } ], - "totals": ["","8873898"], + "rows": 3, - "extremes": - { - "min": ["","1480"], - "max": ["","8267016"] - }, - - "rows": 5, - - "rows_before_limit_at_least": 141137 + "rows_before_limit_at_least": 3 } ``` -This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table). -See also the `JSONEachRow` format. +## JSONCompact {#jsoncompact} +## JSONCompactString {#jsoncompactstring} -## JSONStrings {#jsonstrings} +Differs from JSON only in that data rows are output in arrays, not in objects. 
-Differs from JSON and JSONCompact only in that data rows are output in arrays of strings. +Example: -This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table). -See also the `JSONEachRow` format. +``` json +// JSONCompact +{ + "meta": + [ + { + "name": "'hello'", + "type": "String" + }, + { + "name": "multiply(42, number)", + "type": "UInt64" + }, + { + "name": "range(5)", + "type": "Array(UInt8)" + } + ], + + "data": + [ + ["hello", "0", [0,1,2,3,4]], + ["hello", "42", [0,1,2,3,4]], + ["hello", "84", [0,1,2,3,4]] + ], + + "rows": 3, + + "rows_before_limit_at_least": 3 +} +``` + +```json +// JSONCompactString +{ + "meta": + [ + { + "name": "'hello'", + "type": "String" + }, + { + "name": "multiply(42, number)", + "type": "UInt64" + }, + { + "name": "range(5)", + "type": "Array(UInt8)" + } + ], + + "data": + [ + ["hello", "0", "[0,1,2,3,4]"], + ["hello", "42", "[0,1,2,3,4]"], + ["hello", "84", "[0,1,2,3,4]"] + ], + + "rows": 3, + + "rows_before_limit_at_least": 3 +} +``` ## JSONEachRow {#jsoneachrow} +## JSONStringEachRow {#jsonstringeachrow} ## JSONCompactEachRow {#jsoncompacteachrow} -## JSONStringsEachRow {#jsonstringseachrow} +## JSONCompactStringEachRow {#jsoncompactstringeachrow} When using these formats, ClickHouse outputs rows as separated, newline-delimited JSON values, but the data as a whole is not valid JSON. ``` json {"some_int":42,"some_str":"hello","some_tuple":[1,"a"]} // JSONEachRow [42,"hello",[1,"a"]] // JSONCompactEachRow -["42","hello","(2,'a')"] // JSONStringsEachRow +["42","hello","(2,'a')"] // JSONCompactStringsEachRow ``` When inserting the data, you should provide a separate JSON value for each row. +## JSONEachRowWithProgress {#jsoneachrowwithprogress} +## JSONStringEachRowWithProgress {#jsonstringeachrowwithprogress} + +Differs from JSONEachRow/JSONStringEachRow in that ClickHouse will also yield progress information as JSON objects. + +```json +{"row":{"'hello'":"hello","multiply(42, number)":"0","range(5)":[0,1,2,3,4]}} +{"row":{"'hello'":"hello","multiply(42, number)":"42","range(5)":[0,1,2,3,4]}} +{"row":{"'hello'":"hello","multiply(42, number)":"84","range(5)":[0,1,2,3,4]}} +{"progress":{"read_rows":"3","read_bytes":"24","written_rows":"0","written_bytes":"0","total_rows_to_read":"3"}} +``` + +## JSONCompactEachRowWithNamesAndTypes {#jsoncompacteachrowwithnamesandtypes} +## JSONCompactStringEachRowWithNamesAndTypes {#jsoncompactstringeachrowwithnamesandtypes} + +Differs from JSONCompactEachRow/JSONCompactStringEachRow in that the column names and types are written as the first two rows. 
+ +```json +["'hello'", "multiply(42, number)", "range(5)"] +["String", "UInt64", "Array(UInt8)"] +["hello", "0", [0,1,2,3,4]] +["hello", "42", [0,1,2,3,4]] +["hello", "84", [0,1,2,3,4]] +``` + ### Inserting Data {#inserting-data} ``` sql diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index cb378fbea96..871098e00c0 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -352,8 +352,6 @@ void registerInputFormatProcessorJSONEachRow(FormatFactory & factory); void registerOutputFormatProcessorJSONEachRow(FormatFactory & factory); void registerInputFormatProcessorJSONCompactEachRow(FormatFactory & factory); void registerOutputFormatProcessorJSONCompactEachRow(FormatFactory & factory); -void registerInputFormatProcessorJSONStringsEachRow(FormatFactory & factory); -void registerOutputFormatProcessorJSONStringsEachRow(FormatFactory & factory); void registerInputFormatProcessorProtobuf(FormatFactory & factory); void registerOutputFormatProcessorProtobuf(FormatFactory & factory); void registerInputFormatProcessorTemplate(FormatFactory & factory); @@ -380,7 +378,6 @@ void registerOutputFormatProcessorVertical(FormatFactory & factory); void registerOutputFormatProcessorJSON(FormatFactory & factory); void registerOutputFormatProcessorJSONCompact(FormatFactory & factory); void registerOutputFormatProcessorJSONEachRowWithProgress(FormatFactory & factory); -void registerOutputFormatProcessorJSONStrings(FormatFactory & factory); void registerOutputFormatProcessorXML(FormatFactory & factory); void registerOutputFormatProcessorODBCDriver2(FormatFactory & factory); void registerOutputFormatProcessorNull(FormatFactory & factory); @@ -421,8 +418,6 @@ FormatFactory::FormatFactory() registerOutputFormatProcessorJSONEachRow(*this); registerInputFormatProcessorJSONCompactEachRow(*this); registerOutputFormatProcessorJSONCompactEachRow(*this); - registerInputFormatProcessorJSONStringsEachRow(*this); - registerOutputFormatProcessorJSONStringsEachRow(*this); registerInputFormatProcessorProtobuf(*this); registerOutputFormatProcessorProtobuf(*this); registerInputFormatProcessorTemplate(*this); @@ -449,7 +444,6 @@ FormatFactory::FormatFactory() registerOutputFormatProcessorJSON(*this); registerOutputFormatProcessorJSONCompact(*this); registerOutputFormatProcessorJSONEachRowWithProgress(*this); - registerOutputFormatProcessorJSONStrings(*this); registerOutputFormatProcessorXML(*this); registerOutputFormatProcessorODBCDriver2(*this); registerOutputFormatProcessorNull(*this); diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp index 82e3cb795bf..eb697ce5318 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp @@ -1,4 +1,5 @@ #include +#include #include #include @@ -19,8 +20,9 @@ JSONCompactEachRowRowInputFormat::JSONCompactEachRowRowInputFormat(ReadBuffer & const Block & header_, Params params_, const FormatSettings & format_settings_, - bool with_names_) - : IRowInputFormat(header_, in_, std::move(params_)), format_settings(format_settings_), with_names(with_names_) + bool with_names_, + bool yield_strings_) + : IRowInputFormat(header_, in_, std::move(params_)), format_settings(format_settings_), with_names(with_names_), yield_strings(yield_strings_) { const auto & sample = getPort().getHeader(); size_t num_columns = sample.columns(); @@ -200,10 +202,25 @@ void 
JSONCompactEachRowRowInputFormat::readField(size_t index, MutableColumns & { read_columns[index] = true; const auto & type = data_types[index]; - if (format_settings.null_as_default && !type->isNullable()) - read_columns[index] = DataTypeNullable::deserializeTextJSON(*columns[index], in, format_settings, type); + + if (yield_strings) + { + // notice: null_as_default on "null" strings is not supported + + String str; + readJSONString(str, in); + + ReadBufferFromString buf(str); + + type->deserializeAsWholeText(*columns[index], buf, format_settings); + } else - type->deserializeAsTextJSON(*columns[index], in, format_settings); + { + if (format_settings.null_as_default && !type->isNullable()) + read_columns[index] = DataTypeNullable::deserializeTextJSON(*columns[index], in, format_settings, type); + else + type->deserializeAsTextJSON(*columns[index], in, format_settings); + } } catch (Exception & e) { @@ -225,7 +242,7 @@ void registerInputFormatProcessorJSONCompactEachRow(FormatFactory & factory) IRowInputFormat::Params params, const FormatSettings & settings) { - return std::make_shared(buf, sample, std::move(params), settings, false); + return std::make_shared(buf, sample, std::move(params), settings, false, false); }); factory.registerInputFormatProcessor("JSONCompactEachRowWithNamesAndTypes", []( @@ -234,7 +251,25 @@ void registerInputFormatProcessorJSONCompactEachRow(FormatFactory & factory) IRowInputFormat::Params params, const FormatSettings & settings) { - return std::make_shared(buf, sample, std::move(params), settings, true); + return std::make_shared(buf, sample, std::move(params), settings, true, false); + }); + + factory.registerInputFormatProcessor("JSONCompactStringsEachRow", []( + ReadBuffer & buf, + const Block & sample, + IRowInputFormat::Params params, + const FormatSettings & settings) + { + return std::make_shared(buf, sample, std::move(params), settings, false, true); + }); + + factory.registerInputFormatProcessor("JSONCompactStringsEachRowWithNamesAndTypes", []( + ReadBuffer & buf, + const Block & sample, + IRowInputFormat::Params params, + const FormatSettings & settings) + { + return std::make_shared(buf, sample, std::move(params), settings, true, true); }); } diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h index 5c864ebc751..593f297108c 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h @@ -12,12 +12,18 @@ namespace DB class ReadBuffer; -/** A stream for reading data in JSONCompactEachRow and JSONCompactEachRowWithNamesAndTypes formats +/** A stream for reading data in JSONCompactEachRow- formats */ class JSONCompactEachRowRowInputFormat : public IRowInputFormat { public: - JSONCompactEachRowRowInputFormat(ReadBuffer & in_, const Block & header_, Params params_, const FormatSettings & format_settings_, bool with_names_); + JSONCompactEachRowRowInputFormat( + ReadBuffer & in_, + const Block & header_, + Params params_, + const FormatSettings & format_settings_, + bool with_names_, + bool yield_strings_); String getName() const override { return "JSONCompactEachRowRowInputFormat"; } @@ -49,6 +55,7 @@ private: std::vector names_of_columns; bool with_names; + bool yield_strings; }; } diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp index e155dcb4247..ab8fd164c3c 100644 --- 
a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp @@ -12,8 +12,9 @@ JSONCompactEachRowRowOutputFormat::JSONCompactEachRowRowOutputFormat(WriteBuffer const Block & header_, FormatFactory::WriteCallback callback, const FormatSettings & settings_, - bool with_names_) - : IRowOutputFormat(header_, out_, callback), settings(settings_), with_names(with_names_) + bool with_names_, + bool yield_strings_) + : IRowOutputFormat(header_, out_, callback), settings(settings_), with_names(with_names_), yield_strings(yield_strings_) { const auto & sample = getPort(PortKind::Main).getHeader(); NamesAndTypesList columns(sample.getNamesAndTypesList()); @@ -23,7 +24,15 @@ JSONCompactEachRowRowOutputFormat::JSONCompactEachRowRowOutputFormat(WriteBuffer void JSONCompactEachRowRowOutputFormat::writeField(const IColumn & column, const IDataType & type, size_t row_num) { - type.serializeAsTextJSON(column, row_num, out, settings); + if (yield_strings) + { + WriteBufferFromOwnString buf; + + type.serializeAsText(column, row_num, buf, settings); + writeJSONString(buf.str(), out, settings); + } + else + type.serializeAsTextJSON(column, row_num, out, settings); } @@ -97,7 +106,7 @@ void registerOutputFormatProcessorJSONCompactEachRow(FormatFactory & factory) FormatFactory::WriteCallback callback, const FormatSettings & format_settings) { - return std::make_shared(buf, sample, callback, format_settings, false); + return std::make_shared(buf, sample, callback, format_settings, false, false); }); factory.registerOutputFormatProcessor("JSONCompactEachRowWithNamesAndTypes", []( @@ -106,7 +115,25 @@ void registerOutputFormatProcessorJSONCompactEachRow(FormatFactory & factory) FormatFactory::WriteCallback callback, const FormatSettings &format_settings) { - return std::make_shared(buf, sample, callback, format_settings, true); + return std::make_shared(buf, sample, callback, format_settings, true, false); + }); + + factory.registerOutputFormatProcessor("JSONCompactStringsEachRow", []( + WriteBuffer & buf, + const Block & sample, + FormatFactory::WriteCallback callback, + const FormatSettings & format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, false, true); + }); + + factory.registerOutputFormatProcessor("JSONCompactStringsEachRowWithNamesAndTypes", []( + WriteBuffer &buf, + const Block &sample, + FormatFactory::WriteCallback callback, + const FormatSettings &format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, true, true); }); } diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h index a7857a82d2d..56936783e78 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h @@ -15,7 +15,13 @@ namespace DB class JSONCompactEachRowRowOutputFormat : public IRowOutputFormat { public: - JSONCompactEachRowRowOutputFormat(WriteBuffer & out_, const Block & header_, FormatFactory::WriteCallback callback, const FormatSettings & settings_, bool with_names); + JSONCompactEachRowRowOutputFormat( + WriteBuffer & out_, + const Block & header_, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool with_names_, + bool yield_strings_); String getName() const override { return "JSONCompactEachRowRowOutputFormat"; } @@ -41,5 +47,6 @@ private: NamesAndTypes fields; bool with_names; + bool 
yield_strings; }; } diff --git a/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.cpp index 7e56a4643da..c36942cff09 100644 --- a/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.cpp @@ -8,15 +8,28 @@ namespace DB { JSONCompactRowOutputFormat::JSONCompactRowOutputFormat( - WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_) - : JSONRowOutputFormat(out_, header, callback, settings_) + WriteBuffer & out_, + const Block & header, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool yield_strings_) + : JSONRowOutputFormat(out_, header, callback, settings_, yield_strings_) { } void JSONCompactRowOutputFormat::writeField(const IColumn & column, const IDataType & type, size_t row_num) { - type.serializeAsTextJSON(column, row_num, *ostr, settings); + if (yield_strings) + { + WriteBufferFromOwnString buf; + + type.serializeAsText(column, row_num, buf, settings); + writeJSONString(buf.str(), *ostr, settings); + } + else + type.serializeAsTextJSON(column, row_num, *ostr, settings); + ++field_number; } @@ -83,7 +96,16 @@ void registerOutputFormatProcessorJSONCompact(FormatFactory & factory) FormatFactory::WriteCallback callback, const FormatSettings & format_settings) { - return std::make_shared(buf, sample, callback, format_settings); + return std::make_shared(buf, sample, callback, format_settings, false); + }); + + factory.registerOutputFormatProcessor("JSONCompactStrings", []( + WriteBuffer & buf, + const Block & sample, + FormatFactory::WriteCallback callback, + const FormatSettings & format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, true); }); } diff --git a/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.h b/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.h index f4002f74287..6585016c44f 100644 --- a/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONCompactRowOutputFormat.h @@ -11,12 +11,17 @@ namespace DB struct FormatSettings; -/** The stream for outputting data in the JSONCompact format. +/** The stream for outputting data in the JSONCompact- formats. 
*/ class JSONCompactRowOutputFormat : public JSONRowOutputFormat { public: - JSONCompactRowOutputFormat(WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_); + JSONCompactRowOutputFormat( + WriteBuffer & out_, + const Block & header, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool yield_strings_); String getName() const override { return "JSONCompactRowOutputFormat"; } @@ -37,7 +42,6 @@ protected: } void writeTotalsFieldDelimiter() override; - }; } diff --git a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp index 6350db3b211..9ba82fbb009 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp @@ -1,4 +1,5 @@ #include +#include #include #include @@ -29,8 +30,12 @@ enum JSONEachRowRowInputFormat::JSONEachRowRowInputFormat( - ReadBuffer & in_, const Block & header_, Params params_, const FormatSettings & format_settings_) - : IRowInputFormat(header_, in_, std::move(params_)), format_settings(format_settings_), name_map(header_.columns()) + ReadBuffer & in_, + const Block & header_, + Params params_, + const FormatSettings & format_settings_, + bool yield_strings_) + : IRowInputFormat(header_, in_, std::move(params_)), format_settings(format_settings_), name_map(header_.columns()), yield_strings(yield_strings_) { /// In this format, BOM at beginning of stream cannot be confused with value, so it is safe to skip it. skipBOMIfExists(in); @@ -138,10 +143,25 @@ void JSONEachRowRowInputFormat::readField(size_t index, MutableColumns & columns { seen_columns[index] = read_columns[index] = true; const auto & type = getPort().getHeader().getByPosition(index).type; - if (format_settings.null_as_default && !type->isNullable()) - read_columns[index] = DataTypeNullable::deserializeTextJSON(*columns[index], in, format_settings, type); + + if (yield_strings) + { + // notice: null_as_default on "null" strings is not supported + + String str; + readJSONString(str, in); + + ReadBufferFromString buf(str); + + type->deserializeAsWholeText(*columns[index], buf, format_settings); + } else - type->deserializeAsTextJSON(*columns[index], in, format_settings); + { + if (format_settings.null_as_default && !type->isNullable()) + read_columns[index] = DataTypeNullable::deserializeTextJSON(*columns[index], in, format_settings, type); + else + type->deserializeAsTextJSON(*columns[index], in, format_settings); + } } catch (Exception & e) { @@ -318,13 +338,23 @@ void registerInputFormatProcessorJSONEachRow(FormatFactory & factory) IRowInputFormat::Params params, const FormatSettings & settings) { - return std::make_shared(buf, sample, std::move(params), settings); + return std::make_shared(buf, sample, std::move(params), settings, false); + }); + + factory.registerInputFormatProcessor("JSONStringsEachRow", []( + ReadBuffer & buf, + const Block & sample, + IRowInputFormat::Params params, + const FormatSettings & settings) + { + return std::make_shared(buf, sample, std::move(params), settings, true); }); } void registerFileSegmentationEngineJSONEachRow(FormatFactory & factory) { factory.registerFileSegmentationEngine("JSONEachRow", &fileSegmentationEngineJSONEachRowImpl); + factory.registerFileSegmentationEngine("JSONStringsEachRow", &fileSegmentationEngineJSONEachRowImpl); } } diff --git a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.h 
b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.h index a0a4b735a3e..29a6ce6ecb8 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.h +++ b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.h @@ -20,7 +20,12 @@ class ReadBuffer; class JSONEachRowRowInputFormat : public IRowInputFormat { public: - JSONEachRowRowInputFormat(ReadBuffer & in_, const Block & header_, Params params_, const FormatSettings & format_settings_); + JSONEachRowRowInputFormat( + ReadBuffer & in_, + const Block & header_, + Params params_, + const FormatSettings & format_settings_, + bool yield_strings_); String getName() const override { return "JSONEachRowRowInputFormat"; } @@ -75,6 +80,8 @@ private: bool data_in_square_brackets = false; bool allow_new_rows = true; + + bool yield_strings; }; } diff --git a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp index 910a9710de3..069499d99c1 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp @@ -8,8 +8,13 @@ namespace DB { -JSONEachRowRowOutputFormat::JSONEachRowRowOutputFormat(WriteBuffer & out_, const Block & header_, FormatFactory::WriteCallback callback, const FormatSettings & settings_) - : IRowOutputFormat(header_, out_, callback), settings(settings_) +JSONEachRowRowOutputFormat::JSONEachRowRowOutputFormat( + WriteBuffer & out_, + const Block & header_, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool yield_strings_) + : IRowOutputFormat(header_, out_, callback), settings(settings_), yield_strings(yield_strings_) { const auto & sample = getPort(PortKind::Main).getHeader(); size_t columns = sample.columns(); @@ -27,7 +32,17 @@ void JSONEachRowRowOutputFormat::writeField(const IColumn & column, const IDataT { writeString(fields[field_number], out); writeChar(':', out); - type.serializeAsTextJSON(column, row_num, out, settings); + + if (yield_strings) + { + WriteBufferFromOwnString buf; + + type.serializeAsText(column, row_num, buf, settings); + writeJSONString(buf.str(), out, settings); + } + else + type.serializeAsTextJSON(column, row_num, out, settings); + ++field_number; } @@ -59,7 +74,16 @@ void registerOutputFormatProcessorJSONEachRow(FormatFactory & factory) FormatFactory::WriteCallback callback, const FormatSettings & format_settings) { - return std::make_shared(buf, sample, callback, format_settings); + return std::make_shared(buf, sample, callback, format_settings, false); + }); + + factory.registerOutputFormatProcessor("JSONStringsEachRow", []( + WriteBuffer & buf, + const Block & sample, + FormatFactory::WriteCallback callback, + const FormatSettings & format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, true); }); } diff --git a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h index d2b6937cd01..5346a1ab19f 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h @@ -15,7 +15,12 @@ namespace DB class JSONEachRowRowOutputFormat : public IRowOutputFormat { public: - JSONEachRowRowOutputFormat(WriteBuffer & out_, const Block & header_, FormatFactory::WriteCallback callback, const FormatSettings & settings_); + JSONEachRowRowOutputFormat( + WriteBuffer & out_, + const Block & header_, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool 
yield_strings_); String getName() const override { return "JSONEachRowRowOutputFormat"; } @@ -35,6 +40,9 @@ private: Names fields; FormatSettings settings; + +protected: + bool yield_strings; }; } diff --git a/src/Processors/Formats/Impl/JSONEachRowWithProgressRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONEachRowWithProgressRowOutputFormat.cpp index a611b5a129b..35720df9672 100644 --- a/src/Processors/Formats/Impl/JSONEachRowWithProgressRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONEachRowWithProgressRowOutputFormat.cpp @@ -36,7 +36,16 @@ void registerOutputFormatProcessorJSONEachRowWithProgress(FormatFactory & factor FormatFactory::WriteCallback callback, const FormatSettings & format_settings) { - return std::make_shared(buf, sample, callback, format_settings); + return std::make_shared(buf, sample, callback, format_settings, false); + }); + + factory.registerOutputFormatProcessor("JSONStringsEachRowWithProgress", []( + WriteBuffer & buf, + const Block & sample, + FormatFactory::WriteCallback callback, + const FormatSettings & format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, true); }); } diff --git a/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp index b3255f2894e..7dd7eb9953a 100644 --- a/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp @@ -7,8 +7,13 @@ namespace DB { -JSONRowOutputFormat::JSONRowOutputFormat(WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_) - : IRowOutputFormat(header, out_, callback), settings(settings_) +JSONRowOutputFormat::JSONRowOutputFormat( + WriteBuffer & out_, + const Block & header, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool yield_strings_) + : IRowOutputFormat(header, out_, callback), settings(settings_), yield_strings(yield_strings_) { const auto & sample = getPort(PortKind::Main).getHeader(); NamesAndTypesList columns(sample.getNamesAndTypesList()); @@ -71,7 +76,17 @@ void JSONRowOutputFormat::writeField(const IColumn & column, const IDataType & t writeCString("\t\t\t", *ostr); writeString(fields[field_number].name, *ostr); writeCString(": ", *ostr); - type.serializeAsTextJSON(column, row_num, *ostr, settings); + + if (yield_strings) + { + WriteBufferFromOwnString buf; + + type.serializeAsText(column, row_num, buf, settings); + writeJSONString(buf.str(), *ostr, settings); + } + else + type.serializeAsTextJSON(column, row_num, *ostr, settings); + ++field_number; } @@ -80,7 +95,17 @@ void JSONRowOutputFormat::writeTotalsField(const IColumn & column, const IDataTy writeCString("\t\t", *ostr); writeString(fields[field_number].name, *ostr); writeCString(": ", *ostr); - type.serializeAsTextJSON(column, row_num, *ostr, settings); + + if (yield_strings) + { + WriteBufferFromOwnString buf; + + type.serializeAsText(column, row_num, buf, settings); + writeJSONString(buf.str(), *ostr, settings); + } + else + type.serializeAsTextJSON(column, row_num, *ostr, settings); + ++field_number; } @@ -249,7 +274,16 @@ void registerOutputFormatProcessorJSON(FormatFactory & factory) FormatFactory::WriteCallback callback, const FormatSettings & format_settings) { - return std::make_shared(buf, sample, callback, format_settings); + return std::make_shared(buf, sample, callback, format_settings, false); + }); + + factory.registerOutputFormatProcessor("JSONStrings", []( + WriteBuffer & buf, + const Block & 
sample, + FormatFactory::WriteCallback callback, + const FormatSettings & format_settings) + { + return std::make_shared(buf, sample, callback, format_settings, true); }); } diff --git a/src/Processors/Formats/Impl/JSONRowOutputFormat.h b/src/Processors/Formats/Impl/JSONRowOutputFormat.h index f9aea3a3e8b..4e9cceb717e 100644 --- a/src/Processors/Formats/Impl/JSONRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONRowOutputFormat.h @@ -16,7 +16,12 @@ namespace DB class JSONRowOutputFormat : public IRowOutputFormat { public: - JSONRowOutputFormat(WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_); + JSONRowOutputFormat( + WriteBuffer & out_, + const Block & header, + FormatFactory::WriteCallback callback, + const FormatSettings & settings_, + bool yield_strings_); String getName() const override { return "JSONRowOutputFormat"; } @@ -78,6 +83,8 @@ protected: Progress progress; Stopwatch watch; FormatSettings settings; + + bool yield_strings; }; } diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp deleted file mode 100644 index fff44a204fb..00000000000 --- a/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.cpp +++ /dev/null @@ -1,245 +0,0 @@ -#include -#include - -#include -#include -#include -#include - -namespace DB -{ - -namespace ErrorCodes -{ - extern const int INCORRECT_DATA; - extern const int CANNOT_READ_ALL_DATA; -} - - -JSONStringsEachRowRowInputFormat::JSONStringsEachRowRowInputFormat(ReadBuffer & in_, - const Block & header_, - Params params_, - const FormatSettings & format_settings_, - bool with_names_) - : IRowInputFormat(header_, in_, std::move(params_)), format_settings(format_settings_), with_names(with_names_) -{ - const auto & sample = getPort().getHeader(); - size_t num_columns = sample.columns(); - - data_types.resize(num_columns); - column_indexes_by_names.reserve(num_columns); - - for (size_t i = 0; i < num_columns; ++i) - { - const auto & column_info = sample.getByPosition(i); - - data_types[i] = column_info.type; - column_indexes_by_names.emplace(column_info.name, i); - } -} - -void JSONStringsEachRowRowInputFormat::resetParser() -{ - IRowInputFormat::resetParser(); - column_indexes_for_input_fields.clear(); - not_seen_columns.clear(); -} - -void JSONStringsEachRowRowInputFormat::readPrefix() -{ - /// In this format, BOM at beginning of stream cannot be confused with value, so it is safe to skip it. 
- skipBOMIfExists(in); - - if (with_names) - { - size_t num_columns = getPort().getHeader().columns(); - read_columns.assign(num_columns, false); - - assertChar('[', in); - do - { - skipWhitespaceIfAny(in); - String column_name; - readJSONString(column_name, in); - addInputColumn(column_name); - skipWhitespaceIfAny(in); - } - while (checkChar(',', in)); - assertChar(']', in); - skipEndOfLine(); - - /// Type checking - assertChar('[', in); - for (size_t i = 0; i < column_indexes_for_input_fields.size(); ++i) - { - skipWhitespaceIfAny(in); - String data_type; - readJSONString(data_type, in); - - if (column_indexes_for_input_fields[i] && - data_types[*column_indexes_for_input_fields[i]]->getName() != data_type) - { - throw Exception( - "Type of '" + getPort().getHeader().getByPosition(*column_indexes_for_input_fields[i]).name - + "' must be " + data_types[*column_indexes_for_input_fields[i]]->getName() + - ", not " + data_type, - ErrorCodes::INCORRECT_DATA - ); - } - - if (i != column_indexes_for_input_fields.size() - 1) - assertChar(',', in); - skipWhitespaceIfAny(in); - } - assertChar(']', in); - } - else - { - size_t num_columns = getPort().getHeader().columns(); - read_columns.assign(num_columns, true); - column_indexes_for_input_fields.resize(num_columns); - - for (size_t i = 0; i < num_columns; ++i) - { - column_indexes_for_input_fields[i] = i; - } - } - - for (size_t i = 0; i < read_columns.size(); ++i) - { - if (!read_columns[i]) - { - not_seen_columns.emplace_back(i); - } - } -} - -void JSONStringsEachRowRowInputFormat::addInputColumn(const String & column_name) -{ - names_of_columns.emplace_back(column_name); - - const auto column_it = column_indexes_by_names.find(column_name); - if (column_it == column_indexes_by_names.end()) - { - if (format_settings.skip_unknown_fields) - { - column_indexes_for_input_fields.push_back(std::nullopt); - return; - } - - throw Exception( - "Unknown field found in JSONStringsEachRow header: '" + column_name + "' " + - "at position " + std::to_string(column_indexes_for_input_fields.size()) + - "\nSet the 'input_format_skip_unknown_fields' parameter explicitly to ignore and proceed", - ErrorCodes::INCORRECT_DATA - ); - } - - const auto column_index = column_it->second; - - if (read_columns[column_index]) - throw Exception("Duplicate field found while parsing JSONStringsEachRow header: " + column_name, ErrorCodes::INCORRECT_DATA); - - read_columns[column_index] = true; - column_indexes_for_input_fields.emplace_back(column_index); -} - -bool JSONStringsEachRowRowInputFormat::readRow(DB::MutableColumns &columns, DB::RowReadExtension &ext) -{ - skipEndOfLine(); - - if (in.eof()) - return false; - - size_t num_columns = columns.size(); - - read_columns.assign(num_columns, false); - - assertChar('[', in); - for (size_t file_column = 0; file_column < column_indexes_for_input_fields.size(); ++file_column) - { - const auto & table_column = column_indexes_for_input_fields[file_column]; - if (table_column) - { - readField(*table_column, columns); - } - else - { - skipJSONField(in, StringRef(names_of_columns[file_column])); - } - - skipWhitespaceIfAny(in); - if (in.eof()) - throw Exception("Unexpected end of stream while parsing JSONStringsEachRow format", ErrorCodes::CANNOT_READ_ALL_DATA); - if (file_column + 1 != column_indexes_for_input_fields.size()) - { - assertChar(',', in); - skipWhitespaceIfAny(in); - } - } - assertChar(']', in); - - for (const auto & name : not_seen_columns) - columns[name]->insertDefault(); - - ext.read_columns = read_columns; - return 
true; -} - -void JSONStringsEachRowRowInputFormat::skipEndOfLine() -{ - skipWhitespaceIfAny(in); - if (!in.eof() && (*in.position() == ',' || *in.position() == ';')) - ++in.position(); - - skipWhitespaceIfAny(in); -} - -void JSONStringsEachRowRowInputFormat::readField(size_t index, MutableColumns & columns) -{ - try - { - read_columns[index] = true; - const auto & type = data_types[index]; - - String str; - readJSONString(str, in); - - ReadBufferFromString buf(str); - - type->deserializeAsWholeText(*columns[index], buf, format_settings); - } - catch (Exception & e) - { - e.addMessage("(while read the value of key " + getPort().getHeader().getByPosition(index).name + ")"); - throw; - } -} - -void JSONStringsEachRowRowInputFormat::syncAfterError() -{ - skipToUnescapedNextLineOrEOF(in); -} - -void registerInputFormatProcessorJSONStringsEachRow(FormatFactory & factory) -{ - factory.registerInputFormatProcessor("JSONStringsEachRow", []( - ReadBuffer & buf, - const Block & sample, - IRowInputFormat::Params params, - const FormatSettings & settings) - { - return std::make_shared(buf, sample, std::move(params), settings, false); - }); - - factory.registerInputFormatProcessor("JSONStringsEachRowWithNamesAndTypes", []( - ReadBuffer & buf, - const Block & sample, - IRowInputFormat::Params params, - const FormatSettings & settings) - { - return std::make_shared(buf, sample, std::move(params), settings, true); - }); -} - -} diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h b/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h deleted file mode 100644 index ec0a0f7bad9..00000000000 --- a/src/Processors/Formats/Impl/JSONStringsEachRowRowInputFormat.h +++ /dev/null @@ -1,54 +0,0 @@ -#pragma once - -#pragma once - -#include -#include -#include -#include - -namespace DB -{ - -class ReadBuffer; - -/** A stream for reading data in JSONStringsEachRow and JSONStringsEachRowWithNamesAndTypes formats -*/ -class JSONStringsEachRowRowInputFormat : public IRowInputFormat -{ -public: - JSONStringsEachRowRowInputFormat(ReadBuffer & in_, const Block & header_, Params params_, const FormatSettings & format_settings_, bool with_names_); - - String getName() const override { return "JSONStringsEachRowRowInputFormat"; } - - - void readPrefix() override; - bool readRow(MutableColumns & columns, RowReadExtension & ext) override; - bool allowSyncAfterError() const override { return true; } - void syncAfterError() override; - void resetParser() override; - -private: - void addInputColumn(const String & column_name); - void skipEndOfLine(); - void readField(size_t index, MutableColumns & columns); - - const FormatSettings format_settings; - - using IndexesMap = std::unordered_map; - IndexesMap column_indexes_by_names; - - using OptionalIndexes = std::vector>; - OptionalIndexes column_indexes_for_input_fields; - - DataTypes data_types; - std::vector read_columns; - std::vector not_seen_columns; - - /// This is for the correct exceptions in skipping unknown fields. 
- std::vector names_of_columns; - - bool with_names; -}; - -} diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp deleted file mode 100644 index 75007ea236e..00000000000 --- a/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp +++ /dev/null @@ -1,117 +0,0 @@ -#include -#include -#include -#include - - -namespace DB -{ - - -JSONStringsEachRowRowOutputFormat::JSONStringsEachRowRowOutputFormat(WriteBuffer & out_, - const Block & header_, - FormatFactory::WriteCallback callback, - const FormatSettings & settings_, - bool with_names_) - : IRowOutputFormat(header_, out_, callback), settings(settings_), with_names(with_names_) -{ - const auto & sample = getPort(PortKind::Main).getHeader(); - NamesAndTypesList columns(sample.getNamesAndTypesList()); - fields.assign(columns.begin(), columns.end()); -} - - -void JSONStringsEachRowRowOutputFormat::writeField(const IColumn & column, const IDataType & type, size_t row_num) -{ - WriteBufferFromOwnString buf; - - type.serializeAsText(column, row_num, buf, settings); - writeJSONString(buf.str(), out, settings); -} - - -void JSONStringsEachRowRowOutputFormat::writeFieldDelimiter() -{ - writeCString(", ", out); -} - - -void JSONStringsEachRowRowOutputFormat::writeRowStartDelimiter() -{ - writeChar('[', out); -} - - -void JSONStringsEachRowRowOutputFormat::writeRowEndDelimiter() -{ - writeCString("]\n", out); -} - -void JSONStringsEachRowRowOutputFormat::writeTotals(const Columns & columns, size_t row_num) -{ - writeChar('\n', out); - size_t num_columns = columns.size(); - writeChar('[', out); - for (size_t i = 0; i < num_columns; ++i) - { - if (i != 0) - JSONStringsEachRowRowOutputFormat::writeFieldDelimiter(); - - JSONStringsEachRowRowOutputFormat::writeField(*columns[i], *types[i], row_num); - } - writeCString("]\n", out); -} - -void JSONStringsEachRowRowOutputFormat::writePrefix() -{ - if (with_names) - { - writeChar('[', out); - for (size_t i = 0; i < fields.size(); ++i) - { - writeChar('\"', out); - writeString(fields[i].name, out); - writeChar('\"', out); - if (i != fields.size() - 1) - writeCString(", ", out); - } - writeCString("]\n[", out); - for (size_t i = 0; i < fields.size(); ++i) - { - writeJSONString(fields[i].type->getName(), out, settings); - if (i != fields.size() - 1) - writeCString(", ", out); - } - writeCString("]\n", out); - } -} - -void JSONStringsEachRowRowOutputFormat::consumeTotals(DB::Chunk chunk) -{ - if (with_names) - IRowOutputFormat::consumeTotals(std::move(chunk)); -} - -void registerOutputFormatProcessorJSONStringsEachRow(FormatFactory & factory) -{ - factory.registerOutputFormatProcessor("JSONStringsEachRow", []( - WriteBuffer & buf, - const Block & sample, - FormatFactory::WriteCallback callback, - const FormatSettings & format_settings) - { - return std::make_shared(buf, sample, callback, format_settings, false); - }); - - factory.registerOutputFormatProcessor("JSONStringsEachRowWithNamesAndTypes", []( - WriteBuffer &buf, - const Block &sample, - FormatFactory::WriteCallback callback, - const FormatSettings &format_settings) - { - return std::make_shared(buf, sample, callback, format_settings, true); - }); -} - - -} diff --git a/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h deleted file mode 100644 index 1d43a333da1..00000000000 --- a/src/Processors/Formats/Impl/JSONStringsEachRowRowOutputFormat.h +++ /dev/null @@ -1,45 +0,0 @@ 
-#pragma once - -#include -#include -#include -#include - - -namespace DB -{ - -/** The stream for outputting data in JSON format, by object per line. - * Does not validate UTF-8. - */ -class JSONStringsEachRowRowOutputFormat : public IRowOutputFormat -{ -public: - JSONStringsEachRowRowOutputFormat(WriteBuffer & out_, const Block & header_, FormatFactory::WriteCallback callback, const FormatSettings & settings_, bool with_names); - - String getName() const override { return "JSONStringsEachRowRowOutputFormat"; } - - void writePrefix() override; - - void writeBeforeTotals() override {} - void writeTotals(const Columns & columns, size_t row_num) override; - void writeAfterTotals() override {} - - void writeField(const IColumn & column, const IDataType & type, size_t row_num) override; - void writeFieldDelimiter() override; - void writeRowStartDelimiter() override; - void writeRowEndDelimiter() override; - -protected: - void consumeTotals(Chunk) override; - /// No extremes. - void consumeExtremes(Chunk) override {} - -private: - FormatSettings settings; - - NamesAndTypes fields; - - bool with_names; -}; -} diff --git a/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp deleted file mode 100644 index 6ccb315f73f..00000000000 --- a/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.cpp +++ /dev/null @@ -1,93 +0,0 @@ -#include -#include - -#include - - -namespace DB -{ - -JSONStringsRowOutputFormat::JSONStringsRowOutputFormat( - WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_) - : JSONRowOutputFormat(out_, header, callback, settings_) -{ -} - - -void JSONStringsRowOutputFormat::writeField(const IColumn & column, const IDataType & type, size_t row_num) -{ - WriteBufferFromOwnString buf; - - type.serializeAsText(column, row_num, buf, settings); - writeJSONString(buf.str(), *ostr, settings); - ++field_number; -} - - -void JSONStringsRowOutputFormat::writeFieldDelimiter() -{ - writeCString(", ", *ostr); -} - -void JSONStringsRowOutputFormat::writeTotalsFieldDelimiter() -{ - writeCString(",", *ostr); -} - - -void JSONStringsRowOutputFormat::writeRowStartDelimiter() -{ - writeCString("\t\t[", *ostr); -} - - -void JSONStringsRowOutputFormat::writeRowEndDelimiter() -{ - writeChar(']', *ostr); - field_number = 0; - ++row_count; -} - -void JSONStringsRowOutputFormat::writeBeforeTotals() -{ - writeCString(",\n", *ostr); - writeChar('\n', *ostr); - writeCString("\t\"totals\": [", *ostr); -} - -void JSONStringsRowOutputFormat::writeAfterTotals() -{ - writeChar(']', *ostr); -} - -void JSONStringsRowOutputFormat::writeExtremesElement(const char * title, const Columns & columns, size_t row_num) -{ - writeCString("\t\t\"", *ostr); - writeCString(title, *ostr); - writeCString("\": [", *ostr); - - size_t extremes_columns = columns.size(); - for (size_t i = 0; i < extremes_columns; ++i) - { - if (i != 0) - writeTotalsFieldDelimiter(); - - writeField(*columns[i], *types[i], row_num); - } - - writeChar(']', *ostr); -} - -void registerOutputFormatProcessorJSONStrings(FormatFactory & factory) -{ - factory.registerOutputFormatProcessor("JSONStrings", []( - WriteBuffer & buf, - const Block & sample, - FormatFactory::WriteCallback callback, - const FormatSettings & format_settings) - { - return std::make_shared(buf, sample, callback, format_settings); - }); -} - -} diff --git a/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h 
b/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h deleted file mode 100644 index b221bc9ee36..00000000000 --- a/src/Processors/Formats/Impl/JSONStringsRowOutputFormat.h +++ /dev/null @@ -1,43 +0,0 @@ -#pragma once - -#include -#include -#include -#include - - -namespace DB -{ - -struct FormatSettings; - -/** The stream for outputting data in the JSONStrings format. - */ -class JSONStringsRowOutputFormat : public JSONRowOutputFormat -{ -public: - JSONStringsRowOutputFormat(WriteBuffer & out_, const Block & header, FormatFactory::WriteCallback callback, const FormatSettings & settings_); - - String getName() const override { return "JSONStringsRowOutputFormat"; } - - void writeField(const IColumn & column, const IDataType & type, size_t row_num) override; - void writeFieldDelimiter() override; - void writeRowStartDelimiter() override; - void writeRowEndDelimiter() override; - - void writeBeforeTotals() override; - void writeAfterTotals() override; - -protected: - void writeExtremesElement(const char * title, const Columns & columns, size_t row_num) override; - - void writeTotalsField(const IColumn & column, const IDataType & type, size_t row_num) override - { - return writeField(column, type, row_num); - } - - void writeTotalsFieldDelimiter() override; - -}; - -} diff --git a/tests/queries/0_stateless/01446_JSONStringsEachRow.sql b/tests/queries/0_stateless/01446_JSONStringsEachRow.sql deleted file mode 100644 index f461b217fe4..00000000000 --- a/tests/queries/0_stateless/01446_JSONStringsEachRow.sql +++ /dev/null @@ -1,63 +0,0 @@ -DROP TABLE IF EXISTS test_table; -DROP TABLE IF EXISTS test_table_2; -SELECT 1; -/* Check JSONStringsEachRow Output */ -CREATE TABLE test_table (value UInt8, name String) ENGINE = MergeTree() ORDER BY value; -INSERT INTO test_table VALUES (1, 'a'), (2, 'b'), (3, 'c'); -SELECT * FROM test_table FORMAT JSONStringsEachRow; -SELECT 2; -/* Check Totals */ -SELECT name, count() AS c FROM test_table GROUP BY name WITH TOTALS ORDER BY name FORMAT JSONStringsEachRow; -SELECT 3; -/* Check JSONStringsEachRowWithNamesAndTypes Output */ -SELECT * FROM test_table FORMAT JSONStringsEachRowWithNamesAndTypes; -SELECT 4; -/* Check Totals */ -SELECT name, count() AS c FROM test_table GROUP BY name WITH TOTALS ORDER BY name FORMAT JSONStringsEachRowWithNamesAndTypes; -DROP TABLE IF EXISTS test_table; -SELECT 5; -/* Check JSONStringsEachRow Input */ -CREATE TABLE test_table (v1 String, v2 UInt8, v3 DEFAULT v2 * 16, v4 UInt8 DEFAULT 8) ENGINE = MergeTree() ORDER BY v2; -INSERT INTO test_table FORMAT JSONStringsEachRow ["first", "1", "2", "NULL"] ["second", "2", "null", "6"]; -SELECT * FROM test_table FORMAT JSONStringsEachRow; -TRUNCATE TABLE test_table; -SELECT 6; -/* Check input_format_null_as_default = 1 */ -SET input_format_null_as_default = 1; -INSERT INTO test_table FORMAT JSONStringsEachRow ["first", "1", "2", "ᴺᵁᴸᴸ"] ["second", "2", "null", "6"]; -SELECT * FROM test_table FORMAT JSONStringsEachRow; -TRUNCATE TABLE test_table; -SELECT 7; -/* Check Nested */ -CREATE TABLE test_table_2 (v1 UInt8, n Nested(id UInt8, name String)) ENGINE = MergeTree() ORDER BY v1; -INSERT INTO test_table_2 FORMAT JSONStringsEachRow ["16", "[15, 16, 17]", "['first', 'second', 'third']"]; -SELECT * FROM test_table_2 FORMAT JSONStringsEachRow; -TRUNCATE TABLE test_table_2; -SELECT 8; -/* Check JSONStringsEachRowWithNamesAndTypes Output */ -SET input_format_null_as_default = 0; -INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "v2", "v3", 
"v4"]["String","UInt8","UInt16","UInt8"]["first", "1", "2", "null"]["second", "2", "null", "6"]; -SELECT * FROM test_table FORMAT JSONStringsEachRow; -TRUNCATE TABLE test_table; -SELECT 9; -/* Check input_format_null_as_default = 1 */ -SET input_format_null_as_default = 1; -INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "v2", "v3", "v4"]["String","UInt8","UInt16","UInt8"]["first", "1", "2", "null"] ["second", "2", "null", "6"]; -SELECT * FROM test_table FORMAT JSONStringsEachRow; -SELECT 10; -/* Check Header */ -TRUNCATE TABLE test_table; -SET input_format_skip_unknown_fields = 1; -INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "v2", "invalid_column"]["String", "UInt8", "UInt8"]["first", "1", "32"]["second", "2", "64"]; -SELECT * FROM test_table FORMAT JSONStringsEachRow; -SELECT 11; -TRUNCATE TABLE test_table; -INSERT INTO test_table FORMAT JSONStringsEachRowWithNamesAndTypes ["v4", "v2", "v3"]["UInt8", "UInt8", "UInt16"]["1", "2", "3"] -SELECT * FROM test_table FORMAT JSONStringsEachRowWithNamesAndTypes; -SELECT 12; -/* Check Nested */ -INSERT INTO test_table_2 FORMAT JSONStringsEachRowWithNamesAndTypes ["v1", "n.id", "n.name"]["UInt8", "Array(UInt8)", "Array(String)"]["16", "[15, 16, 17]", "['first', 'second', 'third']"]; -SELECT * FROM test_table_2 FORMAT JSONStringsEachRowWithNamesAndTypes; - -DROP TABLE IF EXISTS test_table; -DROP TABLE IF EXISTS test_table_2; diff --git a/tests/queries/0_stateless/01446_json_strings_each_row.reference b/tests/queries/0_stateless/01446_json_strings_each_row.reference new file mode 100644 index 00000000000..84d41095b77 --- /dev/null +++ b/tests/queries/0_stateless/01446_json_strings_each_row.reference @@ -0,0 +1,22 @@ +1 +{"value":"1","name":"a"} +{"value":"2","name":"b"} +{"value":"3","name":"c"} +2 +{"name":"a","c":"1"} +{"name":"b","c":"1"} +{"name":"c","c":"1"} +3 +{"row":{"a":"1"}} +{"progress":{"read_rows":"1","read_bytes":"1","written_rows":"0","written_bytes":"0","total_rows_to_read":"0"}} +4 +{"row":{"a":"1"}} +{"progress":{"read_rows":"1","read_bytes":"1","written_rows":"0","written_bytes":"0","total_rows_to_read":"0"}} +5 +{"v1":"first","v2":"1","v3":"2","v4":"0"} +{"v1":"second","v2":"2","v3":"0","v4":"6"} +6 +{"v1":"first","v2":"1","v3":"2","v4":"0"} +{"v1":"second","v2":"2","v3":"0","v4":"6"} +7 +{"v1":"16","n.id":"[15,16,17]","n.name":"['first','second','third']"} diff --git a/tests/queries/0_stateless/01446_json_strings_each_row.sql b/tests/queries/0_stateless/01446_json_strings_each_row.sql new file mode 100644 index 00000000000..98bd3e3ab47 --- /dev/null +++ b/tests/queries/0_stateless/01446_json_strings_each_row.sql @@ -0,0 +1,38 @@ +DROP TABLE IF EXISTS test_table; +DROP TABLE IF EXISTS test_table_2; +SELECT 1; +/* Check JSONStringsEachRow Output */ +CREATE TABLE test_table (value UInt8, name String) ENGINE = MergeTree() ORDER BY value; +INSERT INTO test_table VALUES (1, 'a'), (2, 'b'), (3, 'c'); +SELECT * FROM test_table FORMAT JSONStringsEachRow; +SELECT 2; +/* Check Totals */ +SELECT name, count() AS c FROM test_table GROUP BY name WITH TOTALS ORDER BY name FORMAT JSONStringsEachRow; +SELECT 3; +/* Check JSONStringsEachRowWithProgress Output */ +SELECT 1 as a FROM system.one FORMAT JSONStringsEachRowWithProgress; +SELECT 4; +/* Check Totals */ +SELECT 1 as a FROM system.one GROUP BY a WITH TOTALS ORDER BY a FORMAT JSONStringsEachRowWithProgress; +DROP TABLE IF EXISTS test_table; +SELECT 5; +/* Check JSONStringsEachRow Input */ +CREATE TABLE test_table (v1 String, v2 UInt8, v3 
DEFAULT v2 * 16, v4 UInt8 DEFAULT 8) ENGINE = MergeTree() ORDER BY v2; +INSERT INTO test_table FORMAT JSONStringsEachRow {"v1": "first", "v2": "1", "v3": "2", "v4": "NULL"} {"v1": "second", "v2": "2", "v3": "null", "v4": "6"}; +SELECT * FROM test_table FORMAT JSONStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 6; +/* Check input_format_null_as_default = 1 */ +SET input_format_null_as_default = 1; +INSERT INTO test_table FORMAT JSONStringsEachRow {"v1": "first", "v2": "1", "v3": "2", "v4": "ᴺᵁᴸᴸ"} {"v1": "second", "v2": "2", "v3": "null", "v4": "6"}; +SELECT * FROM test_table FORMAT JSONStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 7; +/* Check Nested */ +CREATE TABLE test_table_2 (v1 UInt8, n Nested(id UInt8, name String)) ENGINE = MergeTree() ORDER BY v1; +INSERT INTO test_table_2 FORMAT JSONStringsEachRow {"v1": "16", "n.id": "[15, 16, 17]", "n.name": "['first', 'second', 'third']"}; +SELECT * FROM test_table_2 FORMAT JSONStringsEachRow; +TRUNCATE TABLE test_table_2; + +DROP TABLE IF EXISTS test_table; +DROP TABLE IF EXISTS test_table_2; diff --git a/tests/queries/0_stateless/01447_json_strings.reference b/tests/queries/0_stateless/01447_json_strings.reference new file mode 100644 index 00000000000..ab88e2f3696 --- /dev/null +++ b/tests/queries/0_stateless/01447_json_strings.reference @@ -0,0 +1,43 @@ +{ + "meta": + [ + { + "name": "1", + "type": "UInt8" + }, + { + "name": "'a'", + "type": "String" + }, + { + "name": "[1, 2, 3]", + "type": "Array(UInt8)" + }, + { + "name": "tuple(1, 'a')", + "type": "Tuple(UInt8, String)" + }, + { + "name": "NULL", + "type": "Nullable(Nothing)" + }, + { + "name": "nan", + "type": "Float64" + } + ], + + "data": + [ + { + "1": "1", + "'a'": "a", + "[1, 2, 3]": "[1,2,3]", + "tuple(1, 'a')": "(1,'a')", + "NULL": "ᴺᵁᴸᴸ", + "nan": "nan" + } + ], + + "rows": 1 +} diff --git a/tests/queries/0_stateless/01447_JSONStrings.sql b/tests/queries/0_stateless/01447_json_strings.sql similarity index 100% rename from tests/queries/0_stateless/01447_JSONStrings.sql rename to tests/queries/0_stateless/01447_json_strings.sql diff --git a/tests/queries/0_stateless/01446_JSONStringsEachRow.reference b/tests/queries/0_stateless/01448_json_compact_strings_each_row.reference similarity index 100% rename from tests/queries/0_stateless/01446_JSONStringsEachRow.reference rename to tests/queries/0_stateless/01448_json_compact_strings_each_row.reference diff --git a/tests/queries/0_stateless/01448_json_compact_strings_each_row.sql b/tests/queries/0_stateless/01448_json_compact_strings_each_row.sql new file mode 100644 index 00000000000..c271de88434 --- /dev/null +++ b/tests/queries/0_stateless/01448_json_compact_strings_each_row.sql @@ -0,0 +1,63 @@ +DROP TABLE IF EXISTS test_table; +DROP TABLE IF EXISTS test_table_2; +SELECT 1; +/* Check JSONCompactStringsEachRow Output */ +CREATE TABLE test_table (value UInt8, name String) ENGINE = MergeTree() ORDER BY value; +INSERT INTO test_table VALUES (1, 'a'), (2, 'b'), (3, 'c'); +SELECT * FROM test_table FORMAT JSONCompactStringsEachRow; +SELECT 2; +/* Check Totals */ +SELECT name, count() AS c FROM test_table GROUP BY name WITH TOTALS ORDER BY name FORMAT JSONCompactStringsEachRow; +SELECT 3; +/* Check JSONCompactStringsEachRowWithNamesAndTypes Output */ +SELECT * FROM test_table FORMAT JSONCompactStringsEachRowWithNamesAndTypes; +SELECT 4; +/* Check Totals */ +SELECT name, count() AS c FROM test_table GROUP BY name WITH TOTALS ORDER BY name FORMAT JSONCompactStringsEachRowWithNamesAndTypes; +DROP TABLE IF EXISTS test_table; 
+SELECT 5; +/* Check JSONCompactStringsEachRow Input */ +CREATE TABLE test_table (v1 String, v2 UInt8, v3 DEFAULT v2 * 16, v4 UInt8 DEFAULT 8) ENGINE = MergeTree() ORDER BY v2; +INSERT INTO test_table FORMAT JSONCompactStringsEachRow ["first", "1", "2", "NULL"] ["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONCompactStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 6; +/* Check input_format_null_as_default = 1 */ +SET input_format_null_as_default = 1; +INSERT INTO test_table FORMAT JSONCompactStringsEachRow ["first", "1", "2", "ᴺᵁᴸᴸ"] ["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONCompactStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 7; +/* Check Nested */ +CREATE TABLE test_table_2 (v1 UInt8, n Nested(id UInt8, name String)) ENGINE = MergeTree() ORDER BY v1; +INSERT INTO test_table_2 FORMAT JSONCompactStringsEachRow ["16", "[15, 16, 17]", "['first', 'second', 'third']"]; +SELECT * FROM test_table_2 FORMAT JSONCompactStringsEachRow; +TRUNCATE TABLE test_table_2; +SELECT 8; +/* Check JSONCompactStringsEachRowWithNamesAndTypes Output */ +SET input_format_null_as_default = 0; +INSERT INTO test_table FORMAT JSONCompactStringsEachRowWithNamesAndTypes ["v1", "v2", "v3", "v4"]["String","UInt8","UInt16","UInt8"]["first", "1", "2", "null"]["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONCompactStringsEachRow; +TRUNCATE TABLE test_table; +SELECT 9; +/* Check input_format_null_as_default = 1 */ +SET input_format_null_as_default = 1; +INSERT INTO test_table FORMAT JSONCompactStringsEachRowWithNamesAndTypes ["v1", "v2", "v3", "v4"]["String","UInt8","UInt16","UInt8"]["first", "1", "2", "null"] ["second", "2", "null", "6"]; +SELECT * FROM test_table FORMAT JSONCompactStringsEachRow; +SELECT 10; +/* Check Header */ +TRUNCATE TABLE test_table; +SET input_format_skip_unknown_fields = 1; +INSERT INTO test_table FORMAT JSONCompactStringsEachRowWithNamesAndTypes ["v1", "v2", "invalid_column"]["String", "UInt8", "UInt8"]["first", "1", "32"]["second", "2", "64"]; +SELECT * FROM test_table FORMAT JSONCompactStringsEachRow; +SELECT 11; +TRUNCATE TABLE test_table; +INSERT INTO test_table FORMAT JSONCompactStringsEachRowWithNamesAndTypes ["v4", "v2", "v3"]["UInt8", "UInt8", "UInt16"]["1", "2", "3"] +SELECT * FROM test_table FORMAT JSONCompactStringsEachRowWithNamesAndTypes; +SELECT 12; +/* Check Nested */ +INSERT INTO test_table_2 FORMAT JSONCompactStringsEachRowWithNamesAndTypes ["v1", "n.id", "n.name"]["UInt8", "Array(UInt8)", "Array(String)"]["16", "[15, 16, 17]", "['first', 'second', 'third']"]; +SELECT * FROM test_table_2 FORMAT JSONCompactStringsEachRowWithNamesAndTypes; + +DROP TABLE IF EXISTS test_table; +DROP TABLE IF EXISTS test_table_2; diff --git a/tests/queries/0_stateless/01447_JSONStrings.reference b/tests/queries/0_stateless/01449_json_compact_strings.reference similarity index 100% rename from tests/queries/0_stateless/01447_JSONStrings.reference rename to tests/queries/0_stateless/01449_json_compact_strings.reference diff --git a/tests/queries/0_stateless/01449_json_compact_strings.sql b/tests/queries/0_stateless/01449_json_compact_strings.sql new file mode 100644 index 00000000000..5b676e30347 --- /dev/null +++ b/tests/queries/0_stateless/01449_json_compact_strings.sql @@ -0,0 +1,10 @@ +SET output_format_write_statistics = 0; + +SELECT + 1, + 'a', + [1, 2, 3], + (1, 'a'), + null, + nan +FORMAT JSONCompactStrings; From 23b9677879a2a0618b35032439650ec08e760c57 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Fri, 4 Sep 2020 08:46:58 
+0300 Subject: [PATCH 021/341] Added a script to import git repository to ClickHouse --- src/Common/ShellCommand.cpp | 4 + src/IO/ReadBufferFromFile.cpp | 3 + src/IO/WriteBufferFromFile.cpp | 3 + utils/CMakeLists.txt | 1 + utils/git-to-clickhouse/CMakeLists.txt | 2 + utils/git-to-clickhouse/git-to-clickhouse.cpp | 638 ++++++++++++++++++ 6 files changed, 651 insertions(+) create mode 100644 utils/git-to-clickhouse/CMakeLists.txt create mode 100644 utils/git-to-clickhouse/git-to-clickhouse.cpp diff --git a/src/Common/ShellCommand.cpp b/src/Common/ShellCommand.cpp index 53ab2301a0a..127f95fef06 100644 --- a/src/Common/ShellCommand.cpp +++ b/src/Common/ShellCommand.cpp @@ -186,6 +186,10 @@ int ShellCommand::tryWait() { wait_called = true; + in.close(); + out.close(); + err.close(); + LOG_TRACE(getLogger(), "Will wait for shell command pid {}", pid); int status = 0; diff --git a/src/IO/ReadBufferFromFile.cpp b/src/IO/ReadBufferFromFile.cpp index 40f69625e68..226615c757e 100644 --- a/src/IO/ReadBufferFromFile.cpp +++ b/src/IO/ReadBufferFromFile.cpp @@ -77,6 +77,9 @@ ReadBufferFromFile::~ReadBufferFromFile() void ReadBufferFromFile::close() { + if (fd < 0) + return; + if (0 != ::close(fd)) throw Exception("Cannot close file", ErrorCodes::CANNOT_CLOSE_FILE); diff --git a/src/IO/WriteBufferFromFile.cpp b/src/IO/WriteBufferFromFile.cpp index b59a110edb4..4ade2e2c971 100644 --- a/src/IO/WriteBufferFromFile.cpp +++ b/src/IO/WriteBufferFromFile.cpp @@ -92,6 +92,9 @@ WriteBufferFromFile::~WriteBufferFromFile() /// Close file before destruction of object. void WriteBufferFromFile::close() { + if (fd < 0) + return; + next(); if (0 != ::close(fd)) diff --git a/utils/CMakeLists.txt b/utils/CMakeLists.txt index 0dd95388e7d..dd03afe9fb8 100644 --- a/utils/CMakeLists.txt +++ b/utils/CMakeLists.txt @@ -29,6 +29,7 @@ if (NOT DEFINED ENABLE_UTILS OR ENABLE_UTILS) add_subdirectory (convert-month-partitioned-parts) add_subdirectory (checksum-for-compressed-block) add_subdirectory (wal-dump) + add_subdirectory (git-to-clickhouse) endif () if (ENABLE_CODE_QUALITY) diff --git a/utils/git-to-clickhouse/CMakeLists.txt b/utils/git-to-clickhouse/CMakeLists.txt new file mode 100644 index 00000000000..0e46b68d471 --- /dev/null +++ b/utils/git-to-clickhouse/CMakeLists.txt @@ -0,0 +1,2 @@ +add_executable (git-to-clickhouse git-to-clickhouse.cpp) +target_link_libraries(git-to-clickhouse PRIVATE dbms boost::program_options) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp new file mode 100644 index 00000000000..42920328ad7 --- /dev/null +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -0,0 +1,638 @@ +#include +#include +#include + +#include + +#include +#include +#include +#include + +#include +#include +#include +#include +#include + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int INCORRECT_DATA; +} + +enum class LineType +{ + Empty, + Comment, + Punct, + Code, +}; + +void writeText(LineType type, WriteBuffer & out) +{ + switch (type) + { + case LineType::Empty: writeString("Empty", out); break; + case LineType::Comment: writeString("Comment", out); break; + case LineType::Punct: writeString("Punct", out); break; + case LineType::Code: writeString("Code", out); break; + } +} + +struct LineChange +{ + int8_t sign{}; /// 1 if added, -1 if deleted + uint16_t line_number_old{}; + uint16_t line_number_new{}; + uint16_t hunk_num{}; /// ordinal number of hunk in diff, starting with 0 + uint16_t hunk_start_line_number_old{}; + uint16_t 
hunk_start_line_number_new{}; + std::string hunk_context; /// The context (like a line with function name) as it is calculated by git + std::string line; /// Line content without leading whitespaces + uint8_t indent{}; /// The number of leading whitespaces or tabs * 4 + LineType line_type{}; + + void setLineInfo(std::string full_line) + { + indent = 0; + + const char * pos = full_line.data(); + const char * end = pos + full_line.size(); + + while (pos < end) + { + if (*pos == ' ') + ++indent; + else if (*pos == '\t') + indent += 4; + else + break; + ++pos; + } + + line.assign(pos, end); + + if (pos == end) + { + line_type = LineType::Empty; + } + else if (pos + 1 < end + && ((pos[0] == '/' && pos[1] == '/') + || (pos[0] == '*' && pos[1] == ' '))) /// This is not precise. + { + line_type = LineType::Comment; + } + else + { + while (pos < end) + { + if (isAlphaNumericASCII(*pos)) + { + line_type = LineType::Code; + break; + } + ++pos; + } + if (pos == end) + line_type = LineType::Punct; + } + } + + void writeTextWithoutNewline(WriteBuffer & out) const + { + writeText(sign, out); + writeChar('\t', out); + writeText(line_number_old, out); + writeChar('\t', out); + writeText(line_number_new, out); + writeChar('\t', out); + writeText(hunk_num, out); + writeChar('\t', out); + writeText(hunk_start_line_number_old, out); + writeChar('\t', out); + writeText(hunk_start_line_number_new, out); + writeChar('\t', out); + writeText(hunk_context, out); + writeChar('\t', out); + writeText(line, out); + writeChar('\t', out); + writeText(indent, out); + writeChar('\t', out); + writeText(line_type, out); + } +}; + +using LineChanges = std::vector; + +enum class FileChangeType +{ + Add, + Delete, + Modify, + Rename, + Copy, + Type, +}; + +void writeText(FileChangeType type, WriteBuffer & out) +{ + switch (type) + { + case FileChangeType::Add: writeString("Add", out); break; + case FileChangeType::Delete: writeString("Delete", out); break; + case FileChangeType::Modify: writeString("Modify", out); break; + case FileChangeType::Rename: writeString("Rename", out); break; + case FileChangeType::Copy: writeString("Copy", out); break; + case FileChangeType::Type: writeString("Type", out); break; + } +} + +struct FileChange +{ + FileChangeType change_type{}; + std::string new_file_path; + std::string old_file_path; + uint16_t lines_added{}; + uint16_t lines_deleted{}; + uint16_t hunks_added{}; + uint16_t hunks_removed{}; + uint16_t hunks_changed{}; + + void writeTextWithoutNewline(WriteBuffer & out) const + { + writeText(change_type, out); + writeChar('\t', out); + writeText(new_file_path, out); + writeChar('\t', out); + writeText(old_file_path, out); + writeChar('\t', out); + writeText(lines_added, out); + writeChar('\t', out); + writeText(lines_deleted, out); + writeChar('\t', out); + writeText(hunks_added, out); + writeChar('\t', out); + writeText(hunks_removed, out); + writeChar('\t', out); + writeText(hunks_changed, out); + } +}; + +struct FileChangeAndLineChanges +{ + FileChange file_change; + LineChanges line_changes; +}; + +struct Commit +{ + std::string hash; + std::string author_name; + std::string author_email; + time_t time{}; + std::string message; + uint32_t files_added{}; + uint32_t files_deleted{}; + uint32_t files_renamed{}; + uint32_t files_modified{}; + uint32_t lines_added{}; + uint32_t lines_deleted{}; + uint32_t hunks_added{}; + uint32_t hunks_removed{}; + uint32_t hunks_changed{}; + + void writeTextWithoutNewline(WriteBuffer & out) const + { + writeText(hash, out); + writeChar('\t', out); + 
writeText(author_name, out); + writeChar('\t', out); + writeText(author_email, out); + writeChar('\t', out); + writeText(time, out); + writeChar('\t', out); + writeText(message, out); + writeChar('\t', out); + writeText(files_added, out); + writeChar('\t', out); + writeText(files_deleted, out); + writeChar('\t', out); + writeText(files_renamed, out); + writeChar('\t', out); + writeText(files_modified, out); + writeChar('\t', out); + writeText(lines_added, out); + writeChar('\t', out); + writeText(lines_deleted, out); + writeChar('\t', out); + writeText(hunks_added, out); + writeChar('\t', out); + writeText(hunks_removed, out); + writeChar('\t', out); + writeText(hunks_changed, out); + } +}; + + +void skipUntilWhitespace(ReadBuffer & buf) +{ + while (!buf.eof()) + { + char * next_pos = find_first_symbols<'\t', '\n', ' '>(buf.position(), buf.buffer().end()); + buf.position() = next_pos; + + if (!buf.hasPendingData()) + continue; + + if (*buf.position() == '\t' || *buf.position() == '\n' || *buf.position() == ' ') + return; + } +} + +void skipUntilNextLine(ReadBuffer & buf) +{ + while (!buf.eof()) + { + char * next_pos = find_first_symbols<'\n'>(buf.position(), buf.buffer().end()); + buf.position() = next_pos; + + if (!buf.hasPendingData()) + continue; + + if (*buf.position() == '\n') + { + ++buf.position(); + return; + } + } +} + +void readStringUntilNextLine(std::string & s, ReadBuffer & buf) +{ + s.clear(); + while (!buf.eof()) + { + char * next_pos = find_first_symbols<'\n'>(buf.position(), buf.buffer().end()); + s.append(buf.position(), next_pos - buf.position()); + buf.position() = next_pos; + + if (!buf.hasPendingData()) + continue; + + if (*buf.position() == '\n') + { + ++buf.position(); + return; + } + } +} + + +struct Result +{ + WriteBufferFromFile commits{"commits.tsv"}; + WriteBufferFromFile file_changes{"file_changes.tsv"}; + WriteBufferFromFile line_changes{"line_changes.tsv"}; +}; + + +void processCommit(std::string hash, Result & result) +{ + std::string command = fmt::format( + "git show --raw --pretty='format:%at%x09%aN%x09%aE%x0A%s%x00' --patch --unified=0 {}", + hash); + + std::cerr << command << "\n"; + + auto commit_info = ShellCommand::execute(command); + auto & in = commit_info->out; + + Commit commit; + commit.hash = hash; + + readText(commit.time, in); + assertChar('\t', in); + readText(commit.author_name, in); + assertChar('\t', in); + readText(commit.author_email, in); + assertChar('\n', in); + readNullTerminated(commit.message, in); + + std::cerr << fmt::format("{}\t{}\n", toString(LocalDateTime(commit.time)), commit.message); + + if (!in.eof()) + assertChar('\n', in); + + /// File changes in form + /// :100644 100644 b90fe6bb94 3ffe4c380f M src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp + /// :100644 100644 828dedf6b5 828dedf6b5 R100 dbms/src/Functions/GeoUtils.h dbms/src/Functions/PolygonUtils.h + + std::map file_changes; + + while (checkChar(':', in)) + { + FileChange file_change; + + for (size_t i = 0; i < 4; ++i) + { + skipUntilWhitespace(in); + skipWhitespaceIfAny(in); + } + + char change_type; + readChar(change_type, in); + + int confidence; + switch (change_type) + { + case 'A': + file_change.change_type = FileChangeType::Add; + ++commit.files_added; + break; + case 'D': + file_change.change_type = FileChangeType::Delete; + ++commit.files_deleted; + break; + case 'M': + file_change.change_type = FileChangeType::Modify; + ++commit.files_modified; + break; + case 'R': + file_change.change_type = FileChangeType::Rename; + ++commit.files_renamed; + 
readText(confidence, in); + break; + case 'C': + file_change.change_type = FileChangeType::Copy; + readText(confidence, in); + break; + case 'T': + file_change.change_type = FileChangeType::Type; + break; + default: + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected file change type: {}", change_type); + } + + skipWhitespaceIfAny(in); + + if (change_type == 'R' || change_type == 'C') + { + readText(file_change.old_file_path, in); + skipWhitespaceIfAny(in); + readText(file_change.new_file_path, in); + } + else + { + readText(file_change.new_file_path, in); + } + + assertChar('\n', in); + + file_changes.emplace( + file_change.new_file_path, + FileChangeAndLineChanges{ file_change, {} }); + } + + if (!in.eof()) + { + assertChar('\n', in); + + /// Diffs for every file in form of + /// --- a/src/Storages/StorageReplicatedMergeTree.cpp + /// +++ b/src/Storages/StorageReplicatedMergeTree.cpp + /// @@ -1387,2 +1387 @@ bool StorageReplicatedMergeTree::tryExecuteMerge(const LogEntry & entry) + /// - table_lock, entry.create_time, reserved_space, entry.deduplicate, + /// - entry.force_ttl); + /// + table_lock, entry.create_time, reserved_space, entry.deduplicate); + + std::string old_file_path; + std::string new_file_path; + FileChangeAndLineChanges * file_change_and_line_changes = nullptr; + LineChange line_change; + + while (!in.eof()) + { + if (checkString("@@ ", in)) + { + if (!file_change_and_line_changes) + { + auto file_name = new_file_path.empty() ? old_file_path : new_file_path; + auto it = file_changes.find(file_name); + if (file_changes.end() == it) + std::cerr << fmt::format("Warning: skipping bad file name {}\n", file_name); + else + file_change_and_line_changes = &it->second; + } + + if (file_change_and_line_changes) + { + uint16_t old_lines = 1; + uint16_t new_lines = 1; + + assertChar('-', in); + readText(line_change.hunk_start_line_number_old, in); + if (checkChar(',', in)) + readText(old_lines, in); + + assertString(" +", in); + readText(line_change.hunk_start_line_number_new, in); + if (checkChar(',', in)) + readText(new_lines, in); + + assertString(" @@", in); + if (checkChar(' ', in)) + readStringUntilNextLine(line_change.hunk_context, in); + else + assertChar('\n', in); + + ++line_change.hunk_num; + line_change.line_number_old = line_change.hunk_start_line_number_old; + line_change.line_number_new = line_change.hunk_start_line_number_new; + + if (old_lines && new_lines) + { + ++commit.hunks_changed; + ++file_change_and_line_changes->file_change.hunks_changed; + } + else if (old_lines) + { + ++commit.hunks_removed; + ++file_change_and_line_changes->file_change.hunks_removed; + } + else if (new_lines) + { + ++commit.hunks_added; + ++file_change_and_line_changes->file_change.hunks_added; + } + } + } + else if (checkChar('-', in)) + { + if (checkString("-- ", in)) + { + if (checkString("a/", in)) + { + readStringUntilNextLine(old_file_path, in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else if (checkString("/dev/null", in)) + { + old_file_path.clear(); + assertChar('\n', in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else + skipUntilNextLine(in); /// Actually it can be the line in diff. Skip it for simplicity. 
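/// (Illustrative note on the three cases handled just above, assuming the usual unified diff layout:
/// "--- a/old/path" names the file's previous path, "--- /dev/null" means the file did not exist
/// before and is being added, and any other line beginning with "---" is treated as ordinary diff
/// content and skipped.)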
+ } + else + { + if (file_change_and_line_changes) + { + ++commit.lines_deleted; + + line_change.sign = -1; + readStringUntilNextLine(line_change.line, in); + line_change.setLineInfo(line_change.line); + + file_change_and_line_changes->line_changes.push_back(line_change); + ++line_change.line_number_old; + } + } + } + else if (checkChar('+', in)) + { + if (checkString("++ ", in)) + { + if (checkString("b/", in)) + { + readStringUntilNextLine(new_file_path, in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else if (checkString("/dev/null", in)) + { + new_file_path.clear(); + assertChar('\n', in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else + skipUntilNextLine(in); /// Actually it can be the line in diff. Skip it for simplicity. + } + else + { + if (file_change_and_line_changes) + { + ++commit.lines_added; + + line_change.sign = 1; + readStringUntilNextLine(line_change.line, in); + line_change.setLineInfo(line_change.line); + + file_change_and_line_changes->line_changes.push_back(line_change); + ++line_change.line_number_new; + } + } + } + else + { + skipUntilNextLine(in); + } + } + } + + /// Write the result + + /// commits table + { + auto & out = result.commits; + + commit.writeTextWithoutNewline(out); + writeChar('\n', out); + } + + for (const auto & elem : file_changes) + { + const FileChange & file_change = elem.second.file_change; + + /// file_changes table + { + auto & out = result.file_changes; + + file_change.writeTextWithoutNewline(out); + writeChar('\t', out); + commit.writeTextWithoutNewline(out); + writeChar('\n', out); + } + + /// line_changes table + for (const auto & line_change : elem.second.line_changes) + { + auto & out = result.line_changes; + + line_change.writeTextWithoutNewline(out); + writeChar('\t', out); + file_change.writeTextWithoutNewline(out); + writeChar('\t', out); + commit.writeTextWithoutNewline(out); + writeChar('\n', out); + } + } +} + + +void processLog() +{ + Result result; + + std::string command = "git log --no-merges --pretty=%H"; + std::cerr << command << "\n"; + auto git_log = ShellCommand::execute(command); + + auto & in = git_log->out; + while (!in.eof()) + { + std::string hash; + readString(hash, in); + assertChar('\n', in); + + std::cerr << fmt::format("Processing commit {}\n", hash); + processCommit(std::move(hash), result); + } +} + + +} + +int main(int /*argc*/, char ** /*argv*/) +try +{ + using namespace DB; + +/* boost::program_options::options_description desc("Allowed options"); + desc.add_options()("help,h", "produce help message"); + + boost::program_options::variables_map options; + boost::program_options::store(boost::program_options::parse_command_line(argc, argv, desc), options); + + if (options.count("help") || argc != 2) + { + std::cout << "Usage: " << argv[0] << std::endl; + std::cout << desc << std::endl; + return 1; + }*/ + + processLog(); + return 0; +} +catch (...) 
+{ + std::cerr << DB::getCurrentExceptionMessage(true) << '\n'; + throw; +} From 338a6e20f60bb21c99ee2c4f261d96bc55ec4b97 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Fri, 4 Sep 2020 09:12:16 +0300 Subject: [PATCH 022/341] Added a script to import git repository to ClickHouse --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 97 +++++++++++++++++++ 1 file changed, 97 insertions(+) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 42920328ad7..314bba0d5b4 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -16,6 +16,101 @@ #include +/** How to use: + +DROP DATABASE IF EXISTS git; +CREATE DATABASE git; + +CREATE TABLE git.commits +( + hash String, + author_name LowCardinality(String), + author_email LowCardinality(String), + time DateTime, + message String, + files_added UInt32, + files_deleted UInt32, + files_renamed UInt32, + files_modified UInt32, + lines_added UInt32, + lines_deleted UInt32, + hunks_added UInt32, + hunks_removed UInt32, + hunks_changed UInt32 +) ENGINE = MergeTree ORDER BY time; + +CREATE TABLE git.file_changes +( + change_type Enum('Add' = 1, 'Delete' = 2, 'Modify' = 3, 'Rename' = 4, 'Copy' = 5, 'Type' = 6), + new_file_path LowCardinality(String), + old_file_path LowCardinality(String), + lines_added UInt16, + lines_deleted UInt16, + hunks_added UInt16, + hunks_removed UInt16, + hunks_changed UInt16, + + commit_hash String, + author_name LowCardinality(String), + author_email LowCardinality(String), + time DateTime, + commit_message String, + commit_files_added UInt32, + commit_files_deleted UInt32, + commit_files_renamed UInt32, + commit_files_modified UInt32, + commit_lines_added UInt32, + commit_lines_deleted UInt32, + commit_hunks_added UInt32, + commit_hunks_removed UInt32, + commit_hunks_changed UInt32 +) ENGINE = MergeTree ORDER BY time; + +CREATE TABLE git.line_changes +( + sign Int8, + line_number_old UInt16, + line_number_new UInt16, + hunk_num UInt16, + hunk_start_line_number_old UInt16, + hunk_start_line_number_new UInt16, + hunk_context LowCardinality(String), + line LowCardinality(String), + indent UInt8, + line_type Enum('Empty' = 0, 'Comment' = 1, 'Punct' = 2, 'Code' = 3), + + file_change_type Enum('Add' = 1, 'Delete' = 2, 'Modify' = 3, 'Rename' = 4, 'Copy' = 5, 'Type' = 6), + new_file_path LowCardinality(String), + old_file_path LowCardinality(String), + file_lines_added UInt16, + file_lines_deleted UInt16, + file_hunks_added UInt16, + file_hunks_removed UInt16, + file_hunks_changed UInt16, + + commit_hash String, + author_name LowCardinality(String), + author_email LowCardinality(String), + time DateTime, + commit_message String, + commit_files_added UInt32, + commit_files_deleted UInt32, + commit_files_renamed UInt32, + commit_files_modified UInt32, + commit_lines_added UInt32, + commit_lines_deleted UInt32, + commit_hunks_added UInt32, + commit_hunks_removed UInt32, + commit_hunks_changed UInt32 +) ENGINE = MergeTree ORDER BY time; + +clickhouse-client --query "INSERT INTO git.commits FORMAT TSV" < commits.tsv +clickhouse-client --query "INSERT INTO git.file_changes FORMAT TSV" < file_changes.tsv +clickhouse-client --query "INSERT INTO git.line_changes FORMAT TSV" < line_changes.tsv + + */ + + namespace DB { @@ -495,6 +590,7 @@ void processCommit(std::string hash, Result & result) if (file_change_and_line_changes) { ++commit.lines_deleted; + ++file_change_and_line_changes->file_change.lines_deleted; line_change.sign = 
-1; readStringUntilNextLine(line_change.line, in); @@ -530,6 +626,7 @@ void processCommit(std::string hash, Result & result) if (file_change_and_line_changes) { ++commit.lines_added; + ++file_change_and_line_changes->file_change.lines_added; line_change.sign = 1; readStringUntilNextLine(line_change.line, in); From 7b95e56e8c902578f8fcebc5d9edeccce1eb35ee Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 6 Sep 2020 03:09:40 +0300 Subject: [PATCH 023/341] Advancements --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 187 +++++++++++++----- 1 file changed, 133 insertions(+), 54 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 314bba0d5b4..d6264a63978 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -1,6 +1,11 @@ #include #include #include +#include +#include +#include + +#include #include @@ -16,7 +21,8 @@ #include -/** How to use: +static constexpr auto documentation = R"( +Prepare the database by executing the following queries: DROP DATABASE IF EXISTS git; CREATE DATABASE git; @@ -44,11 +50,11 @@ CREATE TABLE git.file_changes change_type Enum('Add' = 1, 'Delete' = 2, 'Modify' = 3, 'Rename' = 4, 'Copy' = 5, 'Type' = 6), new_file_path LowCardinality(String), old_file_path LowCardinality(String), - lines_added UInt16, - lines_deleted UInt16, - hunks_added UInt16, - hunks_removed UInt16, - hunks_changed UInt16, + lines_added UInt32, + lines_deleted UInt32, + hunks_added UInt32, + hunks_removed UInt32, + hunks_changed UInt32, commit_hash String, author_name LowCardinality(String), @@ -69,11 +75,11 @@ CREATE TABLE git.file_changes CREATE TABLE git.line_changes ( sign Int8, - line_number_old UInt16, - line_number_new UInt16, - hunk_num UInt16, - hunk_start_line_number_old UInt16, - hunk_start_line_number_new UInt16, + line_number_old UInt32, + line_number_new UInt32, + hunk_num UInt32, + hunk_start_line_number_old UInt32, + hunk_start_line_number_new UInt32, hunk_context LowCardinality(String), line LowCardinality(String), indent UInt8, @@ -82,11 +88,11 @@ CREATE TABLE git.line_changes file_change_type Enum('Add' = 1, 'Delete' = 2, 'Modify' = 3, 'Rename' = 4, 'Copy' = 5, 'Type' = 6), new_file_path LowCardinality(String), old_file_path LowCardinality(String), - file_lines_added UInt16, - file_lines_deleted UInt16, - file_hunks_added UInt16, - file_hunks_removed UInt16, - file_hunks_changed UInt16, + file_lines_added UInt32, + file_lines_deleted UInt32, + file_hunks_added UInt32, + file_hunks_removed UInt32, + file_hunks_changed UInt32, commit_hash String, author_name LowCardinality(String), @@ -104,12 +110,15 @@ CREATE TABLE git.line_changes commit_hunks_changed UInt32 ) ENGINE = MergeTree ORDER BY time; +Insert the data with the following commands: + clickhouse-client --query "INSERT INTO git.commits FORMAT TSV" < commits.tsv clickhouse-client --query "INSERT INTO git.file_changes FORMAT TSV" < file_changes.tsv clickhouse-client --query "INSERT INTO git.line_changes FORMAT TSV" < line_changes.tsv - */ +)"; +namespace po = boost::program_options; namespace DB { @@ -141,11 +150,11 @@ void writeText(LineType type, WriteBuffer & out) struct LineChange { int8_t sign{}; /// 1 if added, -1 if deleted - uint16_t line_number_old{}; - uint16_t line_number_new{}; - uint16_t hunk_num{}; /// ordinal number of hunk in diff, starting with 0 - uint16_t hunk_start_line_number_old{}; - uint16_t hunk_start_line_number_new{}; + uint32_t line_number_old{}; + uint32_t 
line_number_new{}; + uint32_t hunk_num{}; /// ordinal number of hunk in diff, starting with 0 + uint32_t hunk_start_line_number_old{}; + uint32_t hunk_start_line_number_new{}; std::string hunk_context; /// The context (like a line with function name) as it is calculated by git std::string line; /// Line content without leading whitespaces uint8_t indent{}; /// The number of leading whitespaces or tabs * 4 @@ -251,11 +260,11 @@ struct FileChange FileChangeType change_type{}; std::string new_file_path; std::string old_file_path; - uint16_t lines_added{}; - uint16_t lines_deleted{}; - uint16_t hunks_added{}; - uint16_t hunks_removed{}; - uint16_t hunks_changed{}; + uint32_t lines_added{}; + uint32_t lines_deleted{}; + uint32_t hunks_added{}; + uint32_t hunks_removed{}; + uint32_t hunks_changed{}; void writeTextWithoutNewline(WriteBuffer & out) const { @@ -395,13 +404,38 @@ struct Result }; -void processCommit(std::string hash, Result & result) +struct Options +{ + bool skip_commits_without_parents = true; + std::optional skip_paths; + std::unordered_set skip_commits; + size_t diff_size_limit = 0; + + Options(const po::variables_map & options) + { + skip_commits_without_parents = options["skip-commits-without-parents"].as(); + if (options.count("skip-paths")) + { + skip_paths.emplace(options["skip-paths"].as()); + } + if (options.count("skip-commit")) + { + auto vec = options["skip-commit"].as>(); + skip_commits.insert(vec.begin(), vec.end()); + } + diff_size_limit = options["diff-size-limit"].as(); + } +}; + + +void processCommit( + const Options & options, size_t commit_num, size_t total_commits, std::string hash, Result & result) { std::string command = fmt::format( - "git show --raw --pretty='format:%at%x09%aN%x09%aE%x0A%s%x00' --patch --unified=0 {}", + "git show --raw --pretty='format:%at%x09%aN%x09%aE%x09%P%x0A%s%x00' --patch --unified=0 {}", hash); - std::cerr << command << "\n"; + //std::cerr << command << "\n"; auto commit_info = ShellCommand::execute(command); auto & in = commit_info->out; @@ -414,10 +448,23 @@ void processCommit(std::string hash, Result & result) readText(commit.author_name, in); assertChar('\t', in); readText(commit.author_email, in); + assertChar('\t', in); + std::string parent_hash; + readString(parent_hash, in); assertChar('\n', in); readNullTerminated(commit.message, in); - std::cerr << fmt::format("{}\t{}\n", toString(LocalDateTime(commit.time)), commit.message); + std::string message_to_print = commit.message; + std::replace_if(message_to_print.begin(), message_to_print.end(), [](char c){ return std::iscntrl(c); }, ' '); + + fmt::print("{}% {} {} {}\n", + commit_num * 100 / total_commits, toString(LocalDateTime(commit.time)), hash, message_to_print); + + if (options.skip_commits_without_parents && commit_num != 0 && parent_hash.empty()) + { + std::cerr << "Warning: skipping commit without parents\n"; + return; + } if (!in.eof()) assertChar('\n', in); @@ -487,9 +534,12 @@ void processCommit(std::string hash, Result & result) assertChar('\n', in); - file_changes.emplace( - file_change.new_file_path, - FileChangeAndLineChanges{ file_change, {} }); + if (!(options.skip_paths && re2_st::RE2::PartialMatch(file_change.new_file_path, *options.skip_paths))) + { + file_changes.emplace( + file_change.new_file_path, + FileChangeAndLineChanges{ file_change, {} }); + } } if (!in.eof()) @@ -517,16 +567,14 @@ void processCommit(std::string hash, Result & result) { auto file_name = new_file_path.empty() ? 
old_file_path : new_file_path; auto it = file_changes.find(file_name); - if (file_changes.end() == it) - std::cerr << fmt::format("Warning: skipping bad file name {}\n", file_name); - else + if (file_changes.end() != it) file_change_and_line_changes = &it->second; } if (file_change_and_line_changes) { - uint16_t old_lines = 1; - uint16_t new_lines = 1; + uint32_t old_lines = 1; + uint32_t new_lines = 1; assertChar('-', in); readText(line_change.hunk_start_line_number_old, in); @@ -644,6 +692,9 @@ void processCommit(std::string hash, Result & result) } } + if (commit.lines_added + commit.lines_deleted > options.diff_size_limit) + return; + /// Write the result /// commits table @@ -684,14 +735,20 @@ void processCommit(std::string hash, Result & result) } -void processLog() +void processLog(const Options & options) { Result result; - std::string command = "git log --no-merges --pretty=%H"; - std::cerr << command << "\n"; + std::string command = "git log --reverse --no-merges --pretty=%H"; + fmt::print("{}\n", command); auto git_log = ShellCommand::execute(command); + /// Collect hashes in memory. This is inefficient but allows to display beautiful progress. + /// The number of commits is in order of single millions for the largest repositories, + /// so don't care about potential waste of ~100 MB of memory. + + std::vector hashes; + auto & in = git_log->out; while (!in.eof()) { @@ -699,33 +756,55 @@ void processLog() readString(hash, in); assertChar('\n', in); - std::cerr << fmt::format("Processing commit {}\n", hash); - processCommit(std::move(hash), result); + if (!options.skip_commits.count(hash)) + hashes.emplace_back(std::move(hash)); + } + + size_t num_commits = hashes.size(); + fmt::print("Total {} commits to process.\n", num_commits); + + for (size_t i = 0; i < num_commits; ++i) + { + processCommit(options, i, num_commits, hashes[i], result); } } } -int main(int /*argc*/, char ** /*argv*/) +int main(int argc, char ** argv) try { using namespace DB; -/* boost::program_options::options_description desc("Allowed options"); - desc.add_options()("help,h", "produce help message"); + po::options_description desc("Allowed options"); + desc.add_options() + ("help,h", "produce help message") + ("skip-commits-without-parents", po::value()->default_value(true), + "Skip commits without parents (except the initial commit)." + " These commits are usually erroneous but they can make sense in very rare cases.") + ("skip-paths", po::value(), + "Skip paths that matches regular expression (re2 syntax).") + ("skip-commit", po::value>(), + "Skip commit with specified hash. 
The option can be specified multiple times.") + ("diff-size-limit", po::value()->default_value(0), + "Skip commits whose diff size (number of added + removed lines) is larger than specified threshold") + ; - boost::program_options::variables_map options; - boost::program_options::store(boost::program_options::parse_command_line(argc, argv, desc), options); + po::variables_map options; + po::store(boost::program_options::parse_command_line(argc, argv, desc), options); - if (options.count("help") || argc != 2) + if (options.count("help")) { - std::cout << "Usage: " << argv[0] << std::endl; - std::cout << desc << std::endl; + std::cout << documentation << '\n' + << "Usage: " << argv[0] << '\n' + << desc << '\n' + << "\nExample:\n" + << "\n./git-to-clickhouse --diff-size-limit 100000 --skip-paths '^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/'\n"; return 1; - }*/ + } - processLog(); + processLog(options); return 0; } catch (...) From abe836a584aeaf71b0ba04b8c8cc670385519e94 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 6 Sep 2020 03:13:39 +0300 Subject: [PATCH 024/341] Remove emails as they are mostly useless --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 20 ++++++------------- 1 file changed, 6 insertions(+), 14 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index d6264a63978..9203efb0043 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -30,8 +30,7 @@ CREATE DATABASE git; CREATE TABLE git.commits ( hash String, - author_name LowCardinality(String), - author_email LowCardinality(String), + author LowCardinality(String), time DateTime, message String, files_added UInt32, @@ -57,8 +56,7 @@ CREATE TABLE git.file_changes hunks_changed UInt32, commit_hash String, - author_name LowCardinality(String), - author_email LowCardinality(String), + author LowCardinality(String), time DateTime, commit_message String, commit_files_added UInt32, @@ -95,8 +93,7 @@ CREATE TABLE git.line_changes file_hunks_changed UInt32, commit_hash String, - author_name LowCardinality(String), - author_email LowCardinality(String), + author LowCardinality(String), time DateTime, commit_message String, commit_files_added UInt32, @@ -295,8 +292,7 @@ struct FileChangeAndLineChanges struct Commit { std::string hash; - std::string author_name; - std::string author_email; + std::string author; time_t time{}; std::string message; uint32_t files_added{}; @@ -313,9 +309,7 @@ struct Commit { writeText(hash, out); writeChar('\t', out); - writeText(author_name, out); - writeChar('\t', out); - writeText(author_email, out); + writeText(author, out); writeChar('\t', out); writeText(time, out); writeChar('\t', out); @@ -445,9 +439,7 @@ void processCommit( readText(commit.time, in); assertChar('\t', in); - readText(commit.author_name, in); - assertChar('\t', in); - readText(commit.author_email, in); + readText(commit.author, in); assertChar('\t', in); std::string parent_hash; readString(parent_hash, in); From 09978decbdf40c95e7cd8855ad804a2ad31cc09d Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 6 Sep 2020 03:47:00 +0300 Subject: [PATCH 025/341] Adjustments --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 52 +++++++++++++------ 1 file changed, 35 insertions(+), 17 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp 
b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 9203efb0043..a81bc6679a7 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -4,6 +4,7 @@ #include #include #include +#include #include @@ -47,8 +48,9 @@ CREATE TABLE git.commits CREATE TABLE git.file_changes ( change_type Enum('Add' = 1, 'Delete' = 2, 'Modify' = 3, 'Rename' = 4, 'Copy' = 5, 'Type' = 6), - new_file_path LowCardinality(String), - old_file_path LowCardinality(String), + path LowCardinality(String), + old_path LowCardinality(String), + file_extension LowCardinality(String), lines_added UInt32, lines_deleted UInt32, hunks_added UInt32, @@ -84,8 +86,9 @@ CREATE TABLE git.line_changes line_type Enum('Empty' = 0, 'Comment' = 1, 'Punct' = 2, 'Code' = 3), file_change_type Enum('Add' = 1, 'Delete' = 2, 'Modify' = 3, 'Rename' = 4, 'Copy' = 5, 'Type' = 6), - new_file_path LowCardinality(String), - old_file_path LowCardinality(String), + path LowCardinality(String), + old_path LowCardinality(String), + file_extension LowCardinality(String), file_lines_added UInt32, file_lines_deleted UInt32, file_hunks_added UInt32, @@ -255,8 +258,9 @@ void writeText(FileChangeType type, WriteBuffer & out) struct FileChange { FileChangeType change_type{}; - std::string new_file_path; - std::string old_file_path; + std::string path; + std::string old_path; + std::string file_extension; uint32_t lines_added{}; uint32_t lines_deleted{}; uint32_t hunks_added{}; @@ -267,9 +271,11 @@ struct FileChange { writeText(change_type, out); writeChar('\t', out); - writeText(new_file_path, out); + writeText(path, out); writeChar('\t', out); - writeText(old_file_path, out); + writeText(old_path, out); + writeChar('\t', out); + writeText(file_extension, out); writeChar('\t', out); writeText(lines_added, out); writeChar('\t', out); @@ -422,11 +428,20 @@ struct Options }; +/// Rough snapshot of repository calculated by application of diffs. It's used to calculate blame info. 
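/// A rough sketch of the intended use, assuming one Commit is remembered per line of each file
/// (identifiers below are illustrative):
///
///     Snapshot snapshot;    /// file path -> per-line history of commits
///     /// when a later diff touches line N of "src/a.cpp", the Commit stored for that line
///     /// supplies prev_commit_hash / prev_author / prev_time, and the entry is then updated
///     /// so that subsequent commits see the new state of the file.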
+struct File +{ + std::vector lines; +}; + +using Snapshot = std::map; + + void processCommit( - const Options & options, size_t commit_num, size_t total_commits, std::string hash, Result & result) + const Options & options, size_t commit_num, size_t total_commits, std::string hash, Snapshot & /*snapshot*/, Result & result) { std::string command = fmt::format( - "git show --raw --pretty='format:%at%x09%aN%x09%aE%x09%P%x0A%s%x00' --patch --unified=0 {}", + "git show --raw --pretty='format:%at%x09%aN%x09%P%x0A%s%x00' --patch --unified=0 {}", hash); //std::cerr << command << "\n"; @@ -515,21 +530,23 @@ void processCommit( if (change_type == 'R' || change_type == 'C') { - readText(file_change.old_file_path, in); + readText(file_change.old_path, in); skipWhitespaceIfAny(in); - readText(file_change.new_file_path, in); + readText(file_change.path, in); } else { - readText(file_change.new_file_path, in); + readText(file_change.path, in); } + file_change.file_extension = std::filesystem::path(file_change.path).extension(); + assertChar('\n', in); - if (!(options.skip_paths && re2_st::RE2::PartialMatch(file_change.new_file_path, *options.skip_paths))) + if (!(options.skip_paths && re2_st::RE2::PartialMatch(file_change.path, *options.skip_paths))) { file_changes.emplace( - file_change.new_file_path, + file_change.path, FileChangeAndLineChanges{ file_change, {} }); } } @@ -755,9 +772,10 @@ void processLog(const Options & options) size_t num_commits = hashes.size(); fmt::print("Total {} commits to process.\n", num_commits); + Snapshot snapshot; for (size_t i = 0; i < num_commits; ++i) { - processCommit(options, i, num_commits, hashes[i], result); + processCommit(options, i, num_commits, hashes[i], snapshot, result); } } @@ -792,7 +810,7 @@ try << "Usage: " << argv[0] << '\n' << desc << '\n' << "\nExample:\n" - << "\n./git-to-clickhouse --diff-size-limit 100000 --skip-paths '^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/'\n"; + << "\n./git-to-clickhouse --diff-size-limit 100000 --skip-paths 'generated\\.cpp|^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/'\n"; return 1; } From d1f1326a1370abd5d837864d02851ef1b3b20745 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 6 Sep 2020 07:02:17 +0300 Subject: [PATCH 026/341] Concurrent processing + history --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 411 ++++++++++++------ 1 file changed, 283 insertions(+), 128 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index a81bc6679a7..6686c1ac480 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -4,6 +4,8 @@ #include #include #include +#include +#include #include #include @@ -80,11 +82,17 @@ CREATE TABLE git.line_changes hunk_num UInt32, hunk_start_line_number_old UInt32, hunk_start_line_number_new UInt32, + hunk_lines_added UInt32, + hunk_lines_deleted UInt32, hunk_context LowCardinality(String), line LowCardinality(String), indent UInt8, line_type Enum('Empty' = 0, 'Comment' = 1, 'Punct' = 2, 'Code' = 3), + prev_commit_hash String, + prev_author LowCardinality(String), + prev_time DateTime, + file_change_type Enum('Add' = 1, 'Delete' = 2, 'Modify' = 3, 'Rename' = 4, 'Copy' = 5, 'Type' = 6), path LowCardinality(String), old_path 
LowCardinality(String), @@ -128,6 +136,112 @@ namespace ErrorCodes extern const int INCORRECT_DATA; } + +struct Commit +{ + std::string hash; + std::string author; + LocalDateTime time{}; + std::string message; + uint32_t files_added{}; + uint32_t files_deleted{}; + uint32_t files_renamed{}; + uint32_t files_modified{}; + uint32_t lines_added{}; + uint32_t lines_deleted{}; + uint32_t hunks_added{}; + uint32_t hunks_removed{}; + uint32_t hunks_changed{}; + + void writeTextWithoutNewline(WriteBuffer & out) const + { + writeText(hash, out); + writeChar('\t', out); + writeText(author, out); + writeChar('\t', out); + writeText(time, out); + writeChar('\t', out); + writeText(message, out); + writeChar('\t', out); + writeText(files_added, out); + writeChar('\t', out); + writeText(files_deleted, out); + writeChar('\t', out); + writeText(files_renamed, out); + writeChar('\t', out); + writeText(files_modified, out); + writeChar('\t', out); + writeText(lines_added, out); + writeChar('\t', out); + writeText(lines_deleted, out); + writeChar('\t', out); + writeText(hunks_added, out); + writeChar('\t', out); + writeText(hunks_removed, out); + writeChar('\t', out); + writeText(hunks_changed, out); + } +}; + + +enum class FileChangeType +{ + Add, + Delete, + Modify, + Rename, + Copy, + Type, +}; + +void writeText(FileChangeType type, WriteBuffer & out) +{ + switch (type) + { + case FileChangeType::Add: writeString("Add", out); break; + case FileChangeType::Delete: writeString("Delete", out); break; + case FileChangeType::Modify: writeString("Modify", out); break; + case FileChangeType::Rename: writeString("Rename", out); break; + case FileChangeType::Copy: writeString("Copy", out); break; + case FileChangeType::Type: writeString("Type", out); break; + } +} + +struct FileChange +{ + FileChangeType change_type{}; + std::string path; + std::string old_path; + std::string file_extension; + uint32_t lines_added{}; + uint32_t lines_deleted{}; + uint32_t hunks_added{}; + uint32_t hunks_removed{}; + uint32_t hunks_changed{}; + + void writeTextWithoutNewline(WriteBuffer & out) const + { + writeText(change_type, out); + writeChar('\t', out); + writeText(path, out); + writeChar('\t', out); + writeText(old_path, out); + writeChar('\t', out); + writeText(file_extension, out); + writeChar('\t', out); + writeText(lines_added, out); + writeChar('\t', out); + writeText(lines_deleted, out); + writeChar('\t', out); + writeText(hunks_added, out); + writeChar('\t', out); + writeText(hunks_removed, out); + writeChar('\t', out); + writeText(hunks_changed, out); + } +}; + + enum class LineType { Empty, @@ -155,10 +269,15 @@ struct LineChange uint32_t hunk_num{}; /// ordinal number of hunk in diff, starting with 0 uint32_t hunk_start_line_number_old{}; uint32_t hunk_start_line_number_new{}; + uint32_t hunk_lines_added{}; + uint32_t hunk_lines_deleted{}; std::string hunk_context; /// The context (like a line with function name) as it is calculated by git std::string line; /// Line content without leading whitespaces uint8_t indent{}; /// The number of leading whitespaces or tabs * 4 LineType line_type{}; + std::string prev_commit_hash; + std::string prev_author; + LocalDateTime prev_time{}; void setLineInfo(std::string full_line) { @@ -220,6 +339,10 @@ struct LineChange writeChar('\t', out); writeText(hunk_start_line_number_new, out); writeChar('\t', out); + writeText(hunk_lines_added, out); + writeChar('\t', out); + writeText(hunk_lines_deleted, out); + writeChar('\t', out); writeText(hunk_context, out); writeChar('\t', out); 
writeText(line, out); @@ -227,120 +350,17 @@ struct LineChange writeText(indent, out); writeChar('\t', out); writeText(line_type, out); + writeChar('\t', out); + writeText(prev_commit_hash, out); + writeChar('\t', out); + writeText(prev_author, out); + writeChar('\t', out); + writeText(prev_time, out); } }; using LineChanges = std::vector; -enum class FileChangeType -{ - Add, - Delete, - Modify, - Rename, - Copy, - Type, -}; - -void writeText(FileChangeType type, WriteBuffer & out) -{ - switch (type) - { - case FileChangeType::Add: writeString("Add", out); break; - case FileChangeType::Delete: writeString("Delete", out); break; - case FileChangeType::Modify: writeString("Modify", out); break; - case FileChangeType::Rename: writeString("Rename", out); break; - case FileChangeType::Copy: writeString("Copy", out); break; - case FileChangeType::Type: writeString("Type", out); break; - } -} - -struct FileChange -{ - FileChangeType change_type{}; - std::string path; - std::string old_path; - std::string file_extension; - uint32_t lines_added{}; - uint32_t lines_deleted{}; - uint32_t hunks_added{}; - uint32_t hunks_removed{}; - uint32_t hunks_changed{}; - - void writeTextWithoutNewline(WriteBuffer & out) const - { - writeText(change_type, out); - writeChar('\t', out); - writeText(path, out); - writeChar('\t', out); - writeText(old_path, out); - writeChar('\t', out); - writeText(file_extension, out); - writeChar('\t', out); - writeText(lines_added, out); - writeChar('\t', out); - writeText(lines_deleted, out); - writeChar('\t', out); - writeText(hunks_added, out); - writeChar('\t', out); - writeText(hunks_removed, out); - writeChar('\t', out); - writeText(hunks_changed, out); - } -}; - -struct FileChangeAndLineChanges -{ - FileChange file_change; - LineChanges line_changes; -}; - -struct Commit -{ - std::string hash; - std::string author; - time_t time{}; - std::string message; - uint32_t files_added{}; - uint32_t files_deleted{}; - uint32_t files_renamed{}; - uint32_t files_modified{}; - uint32_t lines_added{}; - uint32_t lines_deleted{}; - uint32_t hunks_added{}; - uint32_t hunks_removed{}; - uint32_t hunks_changed{}; - - void writeTextWithoutNewline(WriteBuffer & out) const - { - writeText(hash, out); - writeChar('\t', out); - writeText(author, out); - writeChar('\t', out); - writeText(time, out); - writeChar('\t', out); - writeText(message, out); - writeChar('\t', out); - writeText(files_added, out); - writeChar('\t', out); - writeText(files_deleted, out); - writeChar('\t', out); - writeText(files_renamed, out); - writeChar('\t', out); - writeText(files_modified, out); - writeChar('\t', out); - writeText(lines_added, out); - writeChar('\t', out); - writeText(lines_deleted, out); - writeChar('\t', out); - writeText(hunks_added, out); - writeChar('\t', out); - writeText(hunks_removed, out); - writeChar('\t', out); - writeText(hunks_changed, out); - } -}; - void skipUntilWhitespace(ReadBuffer & buf) { @@ -407,13 +427,15 @@ struct Result struct Options { bool skip_commits_without_parents = true; + size_t threads = 1; std::optional skip_paths; std::unordered_set skip_commits; - size_t diff_size_limit = 0; + std::optional diff_size_limit; Options(const po::variables_map & options) { skip_commits_without_parents = options["skip-commits-without-parents"].as(); + threads = options["threads"].as(); if (options.count("skip-paths")) { skip_paths.emplace(options["skip-paths"].as()); @@ -423,36 +445,123 @@ struct Options auto vec = options["skip-commit"].as>(); skip_commits.insert(vec.begin(), vec.end()); } 
- diff_size_limit = options["diff-size-limit"].as(); + if (options.count("diff-size-limit")) + { + diff_size_limit = options["diff-size-limit"].as(); + } } }; /// Rough snapshot of repository calculated by application of diffs. It's used to calculate blame info. -struct File +struct FileBlame { - std::vector lines; + using Lines = std::list; + Lines lines; + Lines::iterator it; + size_t current_idx = 1; + + FileBlame() + { + it = lines.begin(); + } + + FileBlame & operator=(const FileBlame & rhs) + { + lines = rhs.lines; + it = lines.begin(); + current_idx = 1; + return *this; + } + + FileBlame(const FileBlame & rhs) + { + *this = rhs; + } + + void walk(uint32_t num) + { + if (current_idx < num) + { + while (current_idx < num && it != lines.end()) + { + ++current_idx; + ++it; + } + } + else if (current_idx > num) + { + --current_idx; + --it; + } + } + + const Commit * find(uint32_t num) + { + walk(num); + + if (current_idx == num && it != lines.end()) + return &*it; + return {}; + } + + void addLine(uint32_t num, Commit commit) + { + walk(num); + + while (it == lines.end() && current_idx < num) + { + lines.emplace_back(); + ++current_idx; + } + if (it == lines.end()) + { + lines.emplace_back(); + --it; + } + + lines.insert(it, commit); + } + + void removeLine(uint32_t num) + { + walk(num); + + if (current_idx == num) + it = lines.erase(it); + } }; -using Snapshot = std::map; +using Snapshot = std::map; + +struct FileChangeAndLineChanges +{ + FileChangeAndLineChanges(FileChange file_change_) : file_change(file_change_) {} + + FileChange file_change; + LineChanges line_changes; + + std::map deleted_lines; +}; void processCommit( - const Options & options, size_t commit_num, size_t total_commits, std::string hash, Snapshot & /*snapshot*/, Result & result) + std::unique_ptr & commit_info, + const Options & options, + size_t commit_num, + size_t total_commits, + std::string hash, + Snapshot & snapshot, + Result & result) { - std::string command = fmt::format( - "git show --raw --pretty='format:%at%x09%aN%x09%P%x0A%s%x00' --patch --unified=0 {}", - hash); - - //std::cerr << command << "\n"; - - auto commit_info = ShellCommand::execute(command); auto & in = commit_info->out; Commit commit; commit.hash = hash; - readText(commit.time, in); + time_t commit_time; + readText(commit_time, in); + commit.time = commit_time; assertChar('\t', in); readText(commit.author, in); assertChar('\t', in); @@ -465,7 +574,7 @@ void processCommit( std::replace_if(message_to_print.begin(), message_to_print.end(), [](char c){ return std::iscntrl(c); }, ' '); fmt::print("{}% {} {} {}\n", - commit_num * 100 / total_commits, toString(LocalDateTime(commit.time)), hash, message_to_print); + commit_num * 100 / total_commits, toString(commit.time), hash, message_to_print); if (options.skip_commits_without_parents && commit_num != 0 && parent_hash.empty()) { @@ -533,6 +642,8 @@ void processCommit( readText(file_change.old_path, in); skipWhitespaceIfAny(in); readText(file_change.path, in); + + snapshot[file_change.path] = snapshot[file_change.old_path]; } else { @@ -547,7 +658,7 @@ void processCommit( { file_changes.emplace( file_change.path, - FileChangeAndLineChanges{ file_change, {} }); + FileChangeAndLineChanges(file_change)); } } @@ -601,6 +712,9 @@ void processCommit( else assertChar('\n', in); + line_change.hunk_lines_added = new_lines; + line_change.hunk_lines_deleted = old_lines; + ++line_change.hunk_num; line_change.line_number_old = line_change.hunk_start_line_number_old; line_change.line_number_new = 
line_change.hunk_start_line_number_new; @@ -653,6 +767,16 @@ void processCommit( readStringUntilNextLine(line_change.line, in); line_change.setLineInfo(line_change.line); + FileBlame & file_snapshot = snapshot[old_file_path]; + if (const Commit * prev_commit = file_snapshot.find(line_change.line_number_old)) + { + line_change.prev_commit_hash = prev_commit->hash; + line_change.prev_author = prev_commit->author; + line_change.prev_time = prev_commit->time; + file_change_and_line_changes->deleted_lines[line_change.line_number_old] = *prev_commit; + file_snapshot.removeLine(line_change.line_number_old); + } + file_change_and_line_changes->line_changes.push_back(line_change); ++line_change.line_number_old; } @@ -689,6 +813,16 @@ void processCommit( readStringUntilNextLine(line_change.line, in); line_change.setLineInfo(line_change.line); + FileBlame & file_snapshot = snapshot[new_file_path]; + if (file_change_and_line_changes->deleted_lines.count(line_change.line_number_new)) + { + const auto & prev_commit = file_change_and_line_changes->deleted_lines[line_change.line_number_new]; + line_change.prev_commit_hash = prev_commit.hash; + line_change.prev_author = prev_commit.author; + line_change.prev_time = prev_commit.time; + } + file_snapshot.addLine(line_change.line_number_new, commit); + file_change_and_line_changes->line_changes.push_back(line_change); ++line_change.line_number_new; } @@ -701,7 +835,7 @@ void processCommit( } } - if (commit.lines_added + commit.lines_deleted > options.diff_size_limit) + if (options.diff_size_limit && commit.lines_added + commit.lines_deleted > *options.diff_size_limit) return; /// Write the result @@ -744,6 +878,16 @@ void processCommit( } +auto gitShow(const std::string & hash) +{ + std::string command = fmt::format( + "git show --raw --pretty='format:%at%x09%aN%x09%P%x0A%s%x00' --patch --unified=0 {}", + hash); + + return ShellCommand::execute(command); +} + + void processLog(const Options & options) { Result result; @@ -772,10 +916,19 @@ void processLog(const Options & options) size_t num_commits = hashes.size(); fmt::print("Total {} commits to process.\n", num_commits); + /// Will run multiple processes in parallel + size_t num_threads = options.threads; + + std::vector> show_commands(num_threads); + for (size_t i = 0; i < num_commits && i < num_threads; ++i) + show_commands[i] = gitShow(hashes[i]); + Snapshot snapshot; for (size_t i = 0; i < num_commits; ++i) { - processCommit(options, i, num_commits, hashes[i], snapshot, result); + processCommit(show_commands[i % num_threads], options, i, num_commits, hashes[i], snapshot, result); + if (i + num_threads < num_commits) + show_commands[i % num_threads] = gitShow(hashes[i + num_threads]); } } @@ -797,8 +950,10 @@ try "Skip paths that matches regular expression (re2 syntax).") ("skip-commit", po::value>(), "Skip commit with specified hash. 
The option can be specified multiple times.") - ("diff-size-limit", po::value()->default_value(0), + ("diff-size-limit", po::value(), "Skip commits whose diff size (number of added + removed lines) is larger than specified threshold") + ("threads", po::value()->default_value(std::thread::hardware_concurrency()), + "Number of threads to interact with git") ; po::variables_map options; From 3f29453c02ef3d3716927d81258218516b183d7b Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 6 Sep 2020 09:38:48 +0300 Subject: [PATCH 027/341] Roughly working blame --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 179 ++++++++++++++---- 1 file changed, 137 insertions(+), 42 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 6686c1ac480..c1c27a82812 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -4,6 +4,7 @@ #include #include #include +#include #include #include #include @@ -13,6 +14,7 @@ #include #include +#include #include #include #include @@ -427,19 +429,26 @@ struct Result struct Options { bool skip_commits_without_parents = true; + bool skip_commits_with_duplicate_diffs = true; size_t threads = 1; std::optional skip_paths; + std::optional skip_commits_with_messages; std::unordered_set skip_commits; std::optional diff_size_limit; Options(const po::variables_map & options) { skip_commits_without_parents = options["skip-commits-without-parents"].as(); + skip_commits_with_duplicate_diffs = options["skip-commits-with-duplicate-diffs"].as(); threads = options["threads"].as(); if (options.count("skip-paths")) { skip_paths.emplace(options["skip-paths"].as()); } + if (options.count("skip-commits-with-messages")) + { + skip_commits_with_messages.emplace(options["skip-commits-with-messages"].as()); + } if (options.count("skip-commit")) { auto vec = options["skip-commit"].as>(); @@ -481,15 +490,12 @@ struct FileBlame void walk(uint32_t num) { - if (current_idx < num) + while (current_idx < num && it != lines.end()) { - while (current_idx < num && it != lines.end()) - { - ++current_idx; - ++it; - } + ++current_idx; + ++it; } - else if (current_idx > num) + while (current_idx > num) { --current_idx; --it; @@ -500,6 +506,8 @@ struct FileBlame { walk(num); +// std::cerr << "current_idx: " << current_idx << ", num: " << num << "\n"; + if (current_idx == num && it != lines.end()) return &*it; return {}; @@ -514,20 +522,17 @@ struct FileBlame lines.emplace_back(); ++current_idx; } - if (it == lines.end()) - { - lines.emplace_back(); - --it; - } - lines.insert(it, commit); + it = lines.insert(it, commit); } void removeLine(uint32_t num) { +// std::cerr << "Removing line " << num << ", current_idx: " << current_idx << "\n"; + walk(num); - if (current_idx == num) + if (current_idx == num && it != lines.end()) it = lines.erase(it); } }; @@ -540,10 +545,10 @@ struct FileChangeAndLineChanges FileChange file_change; LineChanges line_changes; - - std::map deleted_lines; }; +using DiffHashes = std::unordered_set; + void processCommit( std::unique_ptr & commit_info, @@ -552,6 +557,7 @@ void processCommit( size_t total_commits, std::string hash, Snapshot & snapshot, + DiffHashes & diff_hashes, Result & result) { auto & in = commit_info->out; @@ -570,6 +576,9 @@ void processCommit( assertChar('\n', in); readNullTerminated(commit.message, in); + if (options.skip_commits_with_messages && re2_st::RE2::PartialMatch(commit.message, *options.skip_commits_with_messages)) + return; + 
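/// (For example, running the tool with --skip-commits-with-messages '^Merge branch', as in the
/// command-line help example further below, would skip merge commits whose messages start with
/// that prefix.)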
std::string message_to_print = commit.message; std::replace_if(message_to_print.begin(), message_to_print.end(), [](char c){ return std::iscntrl(c); }, ' '); @@ -643,7 +652,10 @@ void processCommit( skipWhitespaceIfAny(in); readText(file_change.path, in); - snapshot[file_change.path] = snapshot[file_change.old_path]; +// std::cerr << "Move from " << file_change.old_path << " to " << file_change.path << "\n"; + + if (file_change.path != file_change.old_path) + snapshot[file_change.path] = snapshot[file_change.old_path]; } else { @@ -706,6 +718,9 @@ void processCommit( if (checkChar(',', in)) readText(new_lines, in); + if (line_change.hunk_start_line_number_new == 0) + line_change.hunk_start_line_number_new = 1; + assertString(" @@", in); if (checkChar(' ', in)) readStringUntilNextLine(line_change.hunk_context, in); @@ -767,16 +782,6 @@ void processCommit( readStringUntilNextLine(line_change.line, in); line_change.setLineInfo(line_change.line); - FileBlame & file_snapshot = snapshot[old_file_path]; - if (const Commit * prev_commit = file_snapshot.find(line_change.line_number_old)) - { - line_change.prev_commit_hash = prev_commit->hash; - line_change.prev_author = prev_commit->author; - line_change.prev_time = prev_commit->time; - file_change_and_line_changes->deleted_lines[line_change.line_number_old] = *prev_commit; - file_snapshot.removeLine(line_change.line_number_old); - } - file_change_and_line_changes->line_changes.push_back(line_change); ++line_change.line_number_old; } @@ -813,16 +818,6 @@ void processCommit( readStringUntilNextLine(line_change.line, in); line_change.setLineInfo(line_change.line); - FileBlame & file_snapshot = snapshot[new_file_path]; - if (file_change_and_line_changes->deleted_lines.count(line_change.line_number_new)) - { - const auto & prev_commit = file_change_and_line_changes->deleted_lines[line_change.line_number_new]; - line_change.prev_commit_hash = prev_commit.hash; - line_change.prev_author = prev_commit.author; - line_change.prev_time = prev_commit.time; - } - file_snapshot.addLine(line_change.line_number_new, commit); - file_change_and_line_changes->line_changes.push_back(line_change); ++line_change.line_number_new; } @@ -838,6 +833,99 @@ void processCommit( if (options.diff_size_limit && commit.lines_added + commit.lines_deleted > *options.diff_size_limit) return; + /// Calculate hash of diff and skip duplicates + if (options.skip_commits_with_duplicate_diffs) + { + SipHash hasher; + + for (auto & elem : file_changes) + { + hasher.update(elem.second.file_change.change_type); + hasher.update(elem.second.file_change.old_path.size()); + hasher.update(elem.second.file_change.old_path); + hasher.update(elem.second.file_change.path.size()); + hasher.update(elem.second.file_change.path); + + hasher.update(elem.second.line_changes.size()); + for (auto & line_change : elem.second.line_changes) + { + hasher.update(line_change.sign); + hasher.update(line_change.line_number_old); + hasher.update(line_change.line_number_new); + hasher.update(line_change.indent); + hasher.update(line_change.line.size()); + hasher.update(line_change.line); + } + } + + UInt128 hash_of_diff; + hasher.get128(hash_of_diff.low, hash_of_diff.high); + + if (!diff_hashes.insert(hash_of_diff).second) + return; + } + + /// Update snapshot and blame info + + for (auto & elem : file_changes) + { +// std::cerr << elem.first << "\n"; + + FileBlame & file_snapshot = snapshot[elem.first]; + std::unordered_map deleted_lines; + + /// Obtain blame info from previous state of the snapshot + + for (auto & 
line_change : elem.second.line_changes) + { + if (line_change.sign == -1) + { + if (const Commit * prev_commit = file_snapshot.find(line_change.line_number_old); + prev_commit && prev_commit->time <= commit.time) + { + line_change.prev_commit_hash = prev_commit->hash; + line_change.prev_author = prev_commit->author; + line_change.prev_time = prev_commit->time; + deleted_lines[line_change.line_number_old] = *prev_commit; + } + else + { + // std::cerr << "Did not find line " << line_change.line_number_old << " from file " << elem.first << ": " << line_change.line << "\n"; + } + } + else if (line_change.sign == 1) + { + uint32_t this_line_in_prev_commit = line_change.hunk_start_line_number_old + + (line_change.line_number_new - line_change.hunk_start_line_number_new); + + if (deleted_lines.count(this_line_in_prev_commit)) + { + const auto & prev_commit = deleted_lines[this_line_in_prev_commit]; + if (prev_commit.time <= commit.time) + { + line_change.prev_commit_hash = prev_commit.hash; + line_change.prev_author = prev_commit.author; + line_change.prev_time = prev_commit.time; + } + } + } + } + + /// Update the snapshot + + for (const auto & line_change : elem.second.line_changes) + { + if (line_change.sign == -1) + { + file_snapshot.removeLine(line_change.line_number_new); + } + else if (line_change.sign == 1) + { + file_snapshot.addLine(line_change.line_number_new, commit); + } + } + } + /// Write the result /// commits table @@ -881,7 +969,7 @@ void processCommit( auto gitShow(const std::string & hash) { std::string command = fmt::format( - "git show --raw --pretty='format:%at%x09%aN%x09%P%x0A%s%x00' --patch --unified=0 {}", + "git show --raw --pretty='format:%ct%x09%aN%x09%P%x0A%s%x00' --patch --unified=0 {}", hash); return ShellCommand::execute(command); @@ -924,9 +1012,11 @@ void processLog(const Options & options) show_commands[i] = gitShow(hashes[i]); Snapshot snapshot; + DiffHashes diff_hashes; + for (size_t i = 0; i < num_commits; ++i) { - processCommit(show_commands[i % num_threads], options, i, num_commits, hashes[i], snapshot, result); + processCommit(show_commands[i % num_threads], options, i, num_commits, hashes[i], snapshot, diff_hashes, result); if (i + num_threads < num_commits) show_commands[i % num_threads] = gitShow(hashes[i + num_threads]); } @@ -946,10 +1036,15 @@ try ("skip-commits-without-parents", po::value()->default_value(true), "Skip commits without parents (except the initial commit)." " These commits are usually erroneous but they can make sense in very rare cases.") - ("skip-paths", po::value(), - "Skip paths that matches regular expression (re2 syntax).") + ("skip-commits-with-duplicate-diffs", po::value()->default_value(true), + "Skip commits with duplicate diffs." + " These commits are usually results of cherry-pick or merge after rebase.") ("skip-commit", po::value>(), "Skip commit with specified hash. 
The option can be specified multiple times.") + ("skip-paths", po::value(), + "Skip paths that matches regular expression (re2 syntax).") + ("skip-commits-with-messages", po::value(), + "Skip commits whose messages matches regular expression (re2 syntax).") ("diff-size-limit", po::value(), "Skip commits whose diff size (number of added + removed lines) is larger than specified threshold") ("threads", po::value()->default_value(std::thread::hardware_concurrency()), @@ -965,7 +1060,7 @@ try << "Usage: " << argv[0] << '\n' << desc << '\n' << "\nExample:\n" - << "\n./git-to-clickhouse --diff-size-limit 100000 --skip-paths 'generated\\.cpp|^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/'\n"; + << "\n./git-to-clickhouse --diff-size-limit 100000 --skip-paths 'generated\\.cpp|^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/' --skip-commits-with-messages '^Merge branch '\n"; return 1; } From 99c33612d65c627bbb9fc31d9d97906195d3cf53 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 6 Sep 2020 10:29:58 +0300 Subject: [PATCH 028/341] Better diagnostics --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index c1c27a82812..6b29708ead3 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -582,7 +582,7 @@ void processCommit( std::string message_to_print = commit.message; std::replace_if(message_to_print.begin(), message_to_print.end(), [](char c){ return std::iscntrl(c); }, ' '); - fmt::print("{}% {} {} {}\n", + std::cerr << fmt::format("{}% {} {} {}\n", commit_num * 100 / total_commits, toString(commit.time), hash, message_to_print); if (options.skip_commits_without_parents && commit_num != 0 && parent_hash.empty()) From 3ec9656aa21a3142d2898b7d259a4740a6691fd2 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 6 Sep 2020 10:38:39 +0300 Subject: [PATCH 029/341] Slightly more robust --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 10 ++++------ 1 file changed, 4 insertions(+), 6 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 6b29708ead3..f3653bb282f 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -568,12 +568,10 @@ void processCommit( time_t commit_time; readText(commit_time, in); commit.time = commit_time; - assertChar('\t', in); - readText(commit.author, in); - assertChar('\t', in); + assertChar('\0', in); + readNullTerminated(commit.author, in); std::string parent_hash; - readString(parent_hash, in); - assertChar('\n', in); + readNullTerminated(parent_hash, in); readNullTerminated(commit.message, in); if (options.skip_commits_with_messages && re2_st::RE2::PartialMatch(commit.message, *options.skip_commits_with_messages)) @@ -969,7 +967,7 @@ void processCommit( auto gitShow(const std::string & hash) { std::string command = fmt::format( - "git show --raw --pretty='format:%ct%x09%aN%x09%P%x0A%s%x00' --patch --unified=0 {}", + "git show --raw --pretty='format:%ct%x00%aN%x00%P%x00%s%x00' --patch --unified=0 {}", hash); return ShellCommand::execute(command); From 
25ca5e91bd0f3074c8d7d0874e125d2dcc611889 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Sat, 5 Sep 2020 16:09:32 -0700 Subject: [PATCH 030/341] AsynchronousMetricLog - add event_time_microseconds column --- src/Core/Field.h | 3 ++- src/Interpreters/AsynchronousMetricLog.cpp | 17 +++++++++++++---- src/Interpreters/AsynchronousMetricLog.h | 1 + 3 files changed, 16 insertions(+), 5 deletions(-) diff --git a/src/Core/Field.h b/src/Core/Field.h index 0bfdf597543..8973d106c0b 100644 --- a/src/Core/Field.h +++ b/src/Core/Field.h @@ -768,7 +768,8 @@ T & Field::get() // Disregard signedness when converting between int64 types. constexpr Field::Types::Which target = TypeToEnum>::value; assert(target == which - || (isInt64FieldType(target) && isInt64FieldType(which))); + || (isInt64FieldType(target) && isInt64FieldType(which)) + || target == Field::Types::Decimal64 /* DateTime64 fields */); #endif ValueType * MAY_ALIAS ptr = reinterpret_cast(&storage); diff --git a/src/Interpreters/AsynchronousMetricLog.cpp b/src/Interpreters/AsynchronousMetricLog.cpp index e4415773655..d2c81c9dfc5 100644 --- a/src/Interpreters/AsynchronousMetricLog.cpp +++ b/src/Interpreters/AsynchronousMetricLog.cpp @@ -2,6 +2,7 @@ #include #include #include +#include #include #include @@ -13,10 +14,11 @@ Block AsynchronousMetricLogElement::createBlock() { ColumnsWithTypeAndName columns; - columns.emplace_back(std::make_shared(), "event_date"); - columns.emplace_back(std::make_shared(), "event_time"); - columns.emplace_back(std::make_shared(), "name"); - columns.emplace_back(std::make_shared(), "value"); + columns.emplace_back(std::make_shared(), "event_date"); + columns.emplace_back(std::make_shared(), "event_time"); + columns.emplace_back(std::make_shared(6), "event_time_microseconds"); + columns.emplace_back(std::make_shared(), "name"); + columns.emplace_back(std::make_shared(), "value"); return Block(columns); } @@ -28,6 +30,7 @@ void AsynchronousMetricLogElement::appendToBlock(MutableColumns & columns) const columns[column_idx++]->insert(event_date); columns[column_idx++]->insert(event_time); + columns[column_idx++]->insert(event_time_microseconds); columns[column_idx++]->insert(metric_name); columns[column_idx++]->insert(value); } @@ -38,6 +41,11 @@ inline UInt64 time_in_milliseconds(std::chrono::time_point(timepoint.time_since_epoch()).count(); } +inline UInt64 time_in_microseconds(std::chrono::time_point timepoint) +{ + return std::chrono::duration_cast(timepoint.time_since_epoch()).count(); +} + inline UInt64 time_in_seconds(std::chrono::time_point timepoint) { @@ -50,6 +58,7 @@ void AsynchronousMetricLog::addValues(const AsynchronousMetricValues & values) const auto now = std::chrono::system_clock::now(); element.event_time = time_in_seconds(now); + element.event_time_microseconds = time_in_microseconds(now); element.event_date = DateLUT::instance().toDayNum(element.event_time); for (const auto & [key, value] : values) diff --git a/src/Interpreters/AsynchronousMetricLog.h b/src/Interpreters/AsynchronousMetricLog.h index b7d6aab95b6..0c02244246e 100644 --- a/src/Interpreters/AsynchronousMetricLog.h +++ b/src/Interpreters/AsynchronousMetricLog.h @@ -22,6 +22,7 @@ struct AsynchronousMetricLogElement { UInt16 event_date; time_t event_time; + UInt64 event_time_microseconds; std::string metric_name; double value; From 6a5b885ac1167dd8bba4a0c8b091289dd4c1e79e Mon Sep 17 00:00:00 2001 From: bharatnc Date: Sat, 5 Sep 2020 16:17:28 -0700 Subject: [PATCH 031/341] AsynchronousMetricLog - add tests for event_time_microseconds column 
--- .../0_stateless/01473_event_time_microseconds.reference | 2 ++ tests/queries/0_stateless/01473_event_time_microseconds.sql | 5 +++++ 2 files changed, 7 insertions(+) create mode 100644 tests/queries/0_stateless/01473_event_time_microseconds.reference create mode 100644 tests/queries/0_stateless/01473_event_time_microseconds.sql diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.reference b/tests/queries/0_stateless/01473_event_time_microseconds.reference new file mode 100644 index 00000000000..6c3b6ec5c6c --- /dev/null +++ b/tests/queries/0_stateless/01473_event_time_microseconds.reference @@ -0,0 +1,2 @@ +'01473_asynchronous_metric_log_event_start_time_milliseconds_test' +ok \ No newline at end of file diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.sql b/tests/queries/0_stateless/01473_event_time_microseconds.sql new file mode 100644 index 00000000000..af38cf4ca70 --- /dev/null +++ b/tests/queries/0_stateless/01473_event_time_microseconds.sql @@ -0,0 +1,5 @@ +set log_queries = 1; + +select '01473_asynchronous_metric_log_event_start_time_milliseconds_test'; +system flush logs; +SELECT If((select count(event_time_microseconds) from system.asynchronous_metric_log) > 0, 'ok', 'fail'); -- success From 1c1f50c6b665b96d7ba5742a60c770081299213d Mon Sep 17 00:00:00 2001 From: bharatnc Date: Sat, 5 Sep 2020 16:19:38 -0700 Subject: [PATCH 032/341] MetricLog - add event_time_microseconds column --- src/Interpreters/MetricLog.cpp | 14 +++++++++++--- src/Interpreters/MetricLog.h | 1 + 2 files changed, 12 insertions(+), 3 deletions(-) diff --git a/src/Interpreters/MetricLog.cpp b/src/Interpreters/MetricLog.cpp index 69fcc4917b9..ce5d5793b87 100644 --- a/src/Interpreters/MetricLog.cpp +++ b/src/Interpreters/MetricLog.cpp @@ -2,6 +2,7 @@ #include #include #include +#include namespace DB @@ -11,9 +12,10 @@ Block MetricLogElement::createBlock() { ColumnsWithTypeAndName columns_with_type_and_name; - columns_with_type_and_name.emplace_back(std::make_shared(), "event_date"); - columns_with_type_and_name.emplace_back(std::make_shared(), "event_time"); - columns_with_type_and_name.emplace_back(std::make_shared(), "milliseconds"); + columns_with_type_and_name.emplace_back(std::make_shared(), "event_date"); + columns_with_type_and_name.emplace_back(std::make_shared(), "event_time"); + columns_with_type_and_name.emplace_back(std::make_shared(6), "event_time_microseconds"); + columns_with_type_and_name.emplace_back(std::make_shared(), "milliseconds"); for (size_t i = 0, end = ProfileEvents::end(); i < end; ++i) { @@ -41,6 +43,7 @@ void MetricLogElement::appendToBlock(MutableColumns & columns) const columns[column_idx++]->insert(DateLUT::instance().toDayNum(event_time)); columns[column_idx++]->insert(event_time); + columns[column_idx++]->insert(event_time_microseconds); columns[column_idx++]->insert(milliseconds); for (size_t i = 0, end = ProfileEvents::end(); i < end; ++i) @@ -80,6 +83,10 @@ inline UInt64 time_in_milliseconds(std::chrono::time_point(timepoint.time_since_epoch()).count(); } +inline UInt64 time_in_microseconds(std::chrono::time_point timepoint) +{ + return std::chrono::duration_cast(timepoint.time_since_epoch()).count(); +} inline UInt64 time_in_seconds(std::chrono::time_point timepoint) { @@ -102,6 +109,7 @@ void MetricLog::metricThreadFunction() MetricLogElement elem; elem.event_time = std::chrono::system_clock::to_time_t(current_time); + elem.event_time_microseconds = time_in_microseconds(current_time); elem.milliseconds = 
time_in_milliseconds(current_time) - time_in_seconds(current_time) * 1000; elem.profile_events.resize(ProfileEvents::end()); diff --git a/src/Interpreters/MetricLog.h b/src/Interpreters/MetricLog.h index 7774a45d7e1..f52d078bdc9 100644 --- a/src/Interpreters/MetricLog.h +++ b/src/Interpreters/MetricLog.h @@ -18,6 +18,7 @@ namespace DB struct MetricLogElement { time_t event_time{}; + UInt64 event_time_microseconds{}; UInt64 milliseconds{}; std::vector profile_events; From ec0d0243cc994f91fcc8a6a0fd36bde22f853af5 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Sat, 5 Sep 2020 16:21:51 -0700 Subject: [PATCH 033/341] MetricLog - add tests for event_time_microseconds field --- .../0_stateless/01473_event_time_microseconds.reference | 6 ++++-- tests/queries/0_stateless/01473_event_time_microseconds.sql | 4 ++++ 2 files changed, 8 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.reference b/tests/queries/0_stateless/01473_event_time_microseconds.reference index 6c3b6ec5c6c..cac87f32a29 100644 --- a/tests/queries/0_stateless/01473_event_time_microseconds.reference +++ b/tests/queries/0_stateless/01473_event_time_microseconds.reference @@ -1,2 +1,4 @@ -'01473_asynchronous_metric_log_event_start_time_milliseconds_test' -ok \ No newline at end of file +01473_asynchronous_metric_log_event_start_time_milliseconds_test +ok +01473_metric_log_event_start_time_milliseconds_test +ok diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.sql b/tests/queries/0_stateless/01473_event_time_microseconds.sql index af38cf4ca70..6a13d6e1543 100644 --- a/tests/queries/0_stateless/01473_event_time_microseconds.sql +++ b/tests/queries/0_stateless/01473_event_time_microseconds.sql @@ -3,3 +3,7 @@ set log_queries = 1; select '01473_asynchronous_metric_log_event_start_time_milliseconds_test'; system flush logs; SELECT If((select count(event_time_microseconds) from system.asynchronous_metric_log) > 0, 'ok', 'fail'); -- success + +select '01473_metric_log_event_start_time_milliseconds_test'; +system flush logs; +SELECT If((select count(event_time_microseconds) from system.metric_log) > 0, 'ok', 'fail'); -- success From 9de49d130f733c0fcc00d8f7bd85c4fb2eecbfc2 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Sat, 5 Sep 2020 16:36:38 -0700 Subject: [PATCH 034/341] AsynchronousMetricLog & MetricLog - update docs with examples --- .../system-tables/asynchronous_metric_log.md | 25 ++++++------ .../en/operations/system-tables/metric_log.md | 40 +++++++++---------- 2 files changed, 33 insertions(+), 32 deletions(-) diff --git a/docs/en/operations/system-tables/asynchronous_metric_log.md b/docs/en/operations/system-tables/asynchronous_metric_log.md index 6b1d71e1ca6..75607cc30b0 100644 --- a/docs/en/operations/system-tables/asynchronous_metric_log.md +++ b/docs/en/operations/system-tables/asynchronous_metric_log.md @@ -6,6 +6,7 @@ Columns: - `event_date` ([Date](../../sql-reference/data-types/date.md)) — Event date. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Event time. +- `event_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — Event time with microseconds resolution. - `name` ([String](../../sql-reference/data-types/string.md)) — Metric name. - `value` ([Float64](../../sql-reference/data-types/float.md)) — Metric value. 
@@ -16,18 +17,18 @@ SELECT * FROM system.asynchronous_metric_log LIMIT 10 ``` ``` text -┌─event_date─┬──────────event_time─┬─name─────────────────────────────────────┬────value─┐ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.arenas.all.pmuzzy │ 0 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.arenas.all.pdirty │ 4214 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.background_thread.run_intervals │ 0 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.background_thread.num_runs │ 0 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.retained │ 17657856 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.mapped │ 71471104 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.resident │ 61538304 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.metadata │ 6199264 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.allocated │ 38074336 │ -│ 2020-06-22 │ 2020-06-22 06:57:30 │ jemalloc.epoch │ 2 │ -└────────────┴─────────────────────┴──────────────────────────────────────────┴──────────┘ +┌─event_date─┬──────────event_time─┬────event_time_microseconds─┬─name─────────────────────────────────────┬─────value─┐ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ CPUFrequencyMHz_0 │ 2120.9 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.arenas.all.pmuzzy │ 743 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.arenas.all.pdirty │ 26288 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.background_thread.run_intervals │ 0 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.background_thread.num_runs │ 0 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.retained │ 60694528 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.mapped │ 303161344 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.resident │ 260931584 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.metadata │ 12079488 │ +│ 2020-09-05 │ 2020-09-05 15:56:30 │ 2020-09-05 15:56:30.025227 │ jemalloc.allocated │ 133756128 │ +└────────────┴─────────────────────┴────────────────────────────┴──────────────────────────────────────────┴───────────┘ ``` **See Also** diff --git a/docs/en/operations/system-tables/metric_log.md b/docs/en/operations/system-tables/metric_log.md index 9ccf61291d2..063fe81923b 100644 --- a/docs/en/operations/system-tables/metric_log.md +++ b/docs/en/operations/system-tables/metric_log.md @@ -23,28 +23,28 @@ SELECT * FROM system.metric_log LIMIT 1 FORMAT Vertical; ``` text Row 1: ────── -event_date: 2020-02-18 -event_time: 2020-02-18 07:15:33 -milliseconds: 554 -ProfileEvent_Query: 0 -ProfileEvent_SelectQuery: 0 -ProfileEvent_InsertQuery: 0 -ProfileEvent_FileOpen: 0 -ProfileEvent_Seek: 0 -ProfileEvent_ReadBufferFromFileDescriptorRead: 1 -ProfileEvent_ReadBufferFromFileDescriptorReadFailed: 0 -ProfileEvent_ReadBufferFromFileDescriptorReadBytes: 0 -ProfileEvent_WriteBufferFromFileDescriptorWrite: 1 -ProfileEvent_WriteBufferFromFileDescriptorWriteFailed: 0 -ProfileEvent_WriteBufferFromFileDescriptorWriteBytes: 56 +event_date: 2020-09-05 +event_time: 2020-09-05 16:22:33 +event_time_microseconds: 2020-09-05 16:22:33.196807 +milliseconds: 196 +ProfileEvent_Query: 0 +ProfileEvent_SelectQuery: 0 +ProfileEvent_InsertQuery: 0 +ProfileEvent_FailedQuery: 0 +ProfileEvent_FailedSelectQuery: 0 ... 
-CurrentMetric_Query: 0 -CurrentMetric_Merge: 0 -CurrentMetric_PartMutation: 0 -CurrentMetric_ReplicatedFetch: 0 -CurrentMetric_ReplicatedSend: 0 -CurrentMetric_ReplicatedChecks: 0 ... +CurrentMetric_Revision: 54439 +CurrentMetric_VersionInteger: 20009001 +CurrentMetric_RWLockWaitingReaders: 0 +CurrentMetric_RWLockWaitingWriters: 0 +CurrentMetric_RWLockActiveReaders: 0 +CurrentMetric_RWLockActiveWriters: 0 +CurrentMetric_GlobalThread: 74 +CurrentMetric_GlobalThreadActive: 26 +CurrentMetric_LocalThread: 0 +CurrentMetric_LocalThreadActive: 0 +CurrentMetric_DistributedFilesToInsert: 0 ``` **See also** From db58fa15aaf202318e043549440589797b51aa0a Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 02:24:31 +0300 Subject: [PATCH 035/341] Some tweaks --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 21 ++++++++++++++----- 1 file changed, 16 insertions(+), 5 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index f3653bb282f..9e1ef14fcbf 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -435,6 +435,7 @@ struct Options std::optional skip_commits_with_messages; std::unordered_set skip_commits; std::optional diff_size_limit; + std::string stop_after_commit; Options(const po::variables_map & options) { @@ -458,6 +459,10 @@ struct Options { diff_size_limit = options["diff-size-limit"].as(); } + if (options.count("stop-after-commit")) + { + stop_after_commit = options["stop-after-commit"].as(); + } } }; @@ -828,7 +833,7 @@ void processCommit( } } - if (options.diff_size_limit && commit.lines_added + commit.lines_deleted > *options.diff_size_limit) + if (options.diff_size_limit && commit_num != 0 && commit.lines_added + commit.lines_deleted > *options.diff_size_limit) return; /// Calculate hash of diff and skip duplicates @@ -1015,6 +1020,10 @@ void processLog(const Options & options) for (size_t i = 0; i < num_commits; ++i) { processCommit(show_commands[i % num_threads], options, i, num_commits, hashes[i], snapshot, diff_hashes, result); + + if (!options.stop_after_commit.empty() && hashes[i] == options.stop_after_commit) + break; + if (i + num_threads < num_commits) show_commands[i % num_threads] = gitShow(hashes[i + num_threads]); } @@ -1043,10 +1052,12 @@ try "Skip paths that matches regular expression (re2 syntax).") ("skip-commits-with-messages", po::value(), "Skip commits whose messages matches regular expression (re2 syntax).") - ("diff-size-limit", po::value(), - "Skip commits whose diff size (number of added + removed lines) is larger than specified threshold") + ("diff-size-limit", po::value()->default_value(100000), + "Skip commits whose diff size (number of added + removed lines) is larger than specified threshold. 
Does not apply for initial commit.") + ("stop-after-commit", po::value(), + "Stop processing after specified commit hash.") ("threads", po::value()->default_value(std::thread::hardware_concurrency()), - "Number of threads to interact with git") + "Number of concurrent git subprocesses to spawn") ; po::variables_map options; @@ -1058,7 +1069,7 @@ try << "Usage: " << argv[0] << '\n' << desc << '\n' << "\nExample:\n" - << "\n./git-to-clickhouse --diff-size-limit 100000 --skip-paths 'generated\\.cpp|^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/' --skip-commits-with-messages '^Merge branch '\n"; + << "\n./git-to-clickhouse --skip-paths 'generated\\.cpp|^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/' --skip-commits-with-messages '^Merge branch '\n"; return 1; } From 684a910395cc37203453d1faa09ab839d3a4f32a Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 03:17:26 +0300 Subject: [PATCH 036/341] Polish --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 803 ++++++++++-------- 1 file changed, 451 insertions(+), 352 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 9e1ef14fcbf..6e43853d6ba 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -277,10 +277,14 @@ struct LineChange std::string line; /// Line content without leading whitespaces uint8_t indent{}; /// The number of leading whitespaces or tabs * 4 LineType line_type{}; + /// Information from the history (blame). std::string prev_commit_hash; std::string prev_author; LocalDateTime prev_time{}; + /** Classify line to empty / code / comment / single punctuation char. + * Very rough and mostly suitable for our C++ style. + */ void setLineInfo(std::string full_line) { indent = 0; @@ -306,8 +310,9 @@ struct LineChange line_type = LineType::Empty; } else if (pos + 1 < end - && ((pos[0] == '/' && pos[1] == '/') - || (pos[0] == '*' && pos[1] == ' '))) /// This is not precise. + && ((pos[0] == '/' && (pos[1] == '/' || pos[1] == '*')) + || (pos[0] == '*' && pos[1] == ' ') /// This is not precise. + || (pos[0] == '#' && pos[1] == ' '))) { line_type = LineType::Comment; } @@ -363,6 +368,18 @@ struct LineChange using LineChanges = std::vector; +struct FileDiff +{ + FileDiff(FileChange file_change_) : file_change(file_change_) {} + + FileChange file_change; + LineChanges line_changes; +}; + +using CommitDiff = std::map; + + +/** Parsing helpers */ void skipUntilWhitespace(ReadBuffer & buf) { @@ -418,14 +435,57 @@ void readStringUntilNextLine(std::string & s, ReadBuffer & buf) } -struct Result +/** Writes the resulting tables to files that can be imported to ClickHouse. 
+ */ +struct ResultWriter { WriteBufferFromFile commits{"commits.tsv"}; WriteBufferFromFile file_changes{"file_changes.tsv"}; WriteBufferFromFile line_changes{"line_changes.tsv"}; + + void appendCommit(const Commit & commit, const CommitDiff & files) + { + /// commits table + { + auto & out = commits; + + commit.writeTextWithoutNewline(out); + writeChar('\n', out); + } + + for (const auto & elem : files) + { + const FileChange & file_change = elem.second.file_change; + + /// file_changes table + { + auto & out = file_changes; + + file_change.writeTextWithoutNewline(out); + writeChar('\t', out); + commit.writeTextWithoutNewline(out); + writeChar('\n', out); + } + + /// line_changes table + for (const auto & line_change : elem.second.line_changes) + { + auto & out = line_changes; + + line_change.writeTextWithoutNewline(out); + writeChar('\t', out); + file_change.writeTextWithoutNewline(out); + writeChar('\t', out); + commit.writeTextWithoutNewline(out); + writeChar('\n', out); + } + } + } }; +/** See description in "main". + */ struct Options { bool skip_commits_without_parents = true; @@ -467,11 +527,23 @@ struct Options }; -/// Rough snapshot of repository calculated by application of diffs. It's used to calculate blame info. +/** Rough snapshot of repository calculated by application of diffs. It's used to calculate blame info. + * Represented by a list of lines. For every line it contains information about commit that modified this line the last time. + * + * Note that there are many cases when this info may become incorrect. + * The first reason is that git history is non-linear but we form this snapshot by application of commit diffs in some order + * that cannot give us correct results even theoretically. + * The second reason is that we don't process merge commits. But merge commits may contain differences for conflict resolution. + * + * We expect that the information will be mostly correct for the purpose of analytics. + * So, it can provide the expected "blame" info for the most of the lines. + */ struct FileBlame { using Lines = std::list; Lines lines; + + /// We walk through this list adding or removing lines. Lines::iterator it; size_t current_idx = 1; @@ -480,6 +552,7 @@ struct FileBlame it = lines.begin(); } + /// This is important when file was copied or renamed. FileBlame & operator=(const FileBlame & rhs) { lines = rhs.lines; @@ -493,6 +566,7 @@ struct FileBlame *this = rhs; } + /// Move iterator to requested line or stop at the end. void walk(uint32_t num) { while (current_idx < num && it != lines.end()) @@ -522,6 +596,7 @@ struct FileBlame { walk(num); + /// If the inserted line is over the end of file, we insert empty lines before it. while (it == lines.end() && current_idx < num) { lines.emplace_back(); @@ -542,334 +617,24 @@ struct FileBlame } }; +/// All files with their blame info. When file is renamed, we also rename it in snapshot. using Snapshot = std::map; -struct FileChangeAndLineChanges + +/** Enrich the line changes data with the history info from the snapshot + * - the author, time and commit of the previous change to every found line (blame). + * And update the snapshot. 
+ */ +void updateSnapshot(Snapshot & snapshot, const Commit & commit, CommitDiff & file_changes) { - FileChangeAndLineChanges(FileChange file_change_) : file_change(file_change_) {} - - FileChange file_change; - LineChanges line_changes; -}; - -using DiffHashes = std::unordered_set; - - -void processCommit( - std::unique_ptr & commit_info, - const Options & options, - size_t commit_num, - size_t total_commits, - std::string hash, - Snapshot & snapshot, - DiffHashes & diff_hashes, - Result & result) -{ - auto & in = commit_info->out; - - Commit commit; - commit.hash = hash; - - time_t commit_time; - readText(commit_time, in); - commit.time = commit_time; - assertChar('\0', in); - readNullTerminated(commit.author, in); - std::string parent_hash; - readNullTerminated(parent_hash, in); - readNullTerminated(commit.message, in); - - if (options.skip_commits_with_messages && re2_st::RE2::PartialMatch(commit.message, *options.skip_commits_with_messages)) - return; - - std::string message_to_print = commit.message; - std::replace_if(message_to_print.begin(), message_to_print.end(), [](char c){ return std::iscntrl(c); }, ' '); - - std::cerr << fmt::format("{}% {} {} {}\n", - commit_num * 100 / total_commits, toString(commit.time), hash, message_to_print); - - if (options.skip_commits_without_parents && commit_num != 0 && parent_hash.empty()) + /// Renames and copies. + for (auto & elem : file_changes) { - std::cerr << "Warning: skipping commit without parents\n"; - return; + auto & file = elem.second.file_change; + if (file.path != file.old_path) + snapshot[file.path] = snapshot[file.old_path]; } - if (!in.eof()) - assertChar('\n', in); - - /// File changes in form - /// :100644 100644 b90fe6bb94 3ffe4c380f M src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp - /// :100644 100644 828dedf6b5 828dedf6b5 R100 dbms/src/Functions/GeoUtils.h dbms/src/Functions/PolygonUtils.h - - std::map file_changes; - - while (checkChar(':', in)) - { - FileChange file_change; - - for (size_t i = 0; i < 4; ++i) - { - skipUntilWhitespace(in); - skipWhitespaceIfAny(in); - } - - char change_type; - readChar(change_type, in); - - int confidence; - switch (change_type) - { - case 'A': - file_change.change_type = FileChangeType::Add; - ++commit.files_added; - break; - case 'D': - file_change.change_type = FileChangeType::Delete; - ++commit.files_deleted; - break; - case 'M': - file_change.change_type = FileChangeType::Modify; - ++commit.files_modified; - break; - case 'R': - file_change.change_type = FileChangeType::Rename; - ++commit.files_renamed; - readText(confidence, in); - break; - case 'C': - file_change.change_type = FileChangeType::Copy; - readText(confidence, in); - break; - case 'T': - file_change.change_type = FileChangeType::Type; - break; - default: - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected file change type: {}", change_type); - } - - skipWhitespaceIfAny(in); - - if (change_type == 'R' || change_type == 'C') - { - readText(file_change.old_path, in); - skipWhitespaceIfAny(in); - readText(file_change.path, in); - -// std::cerr << "Move from " << file_change.old_path << " to " << file_change.path << "\n"; - - if (file_change.path != file_change.old_path) - snapshot[file_change.path] = snapshot[file_change.old_path]; - } - else - { - readText(file_change.path, in); - } - - file_change.file_extension = std::filesystem::path(file_change.path).extension(); - - assertChar('\n', in); - - if (!(options.skip_paths && re2_st::RE2::PartialMatch(file_change.path, *options.skip_paths))) - { - 
file_changes.emplace( - file_change.path, - FileChangeAndLineChanges(file_change)); - } - } - - if (!in.eof()) - { - assertChar('\n', in); - - /// Diffs for every file in form of - /// --- a/src/Storages/StorageReplicatedMergeTree.cpp - /// +++ b/src/Storages/StorageReplicatedMergeTree.cpp - /// @@ -1387,2 +1387 @@ bool StorageReplicatedMergeTree::tryExecuteMerge(const LogEntry & entry) - /// - table_lock, entry.create_time, reserved_space, entry.deduplicate, - /// - entry.force_ttl); - /// + table_lock, entry.create_time, reserved_space, entry.deduplicate); - - std::string old_file_path; - std::string new_file_path; - FileChangeAndLineChanges * file_change_and_line_changes = nullptr; - LineChange line_change; - - while (!in.eof()) - { - if (checkString("@@ ", in)) - { - if (!file_change_and_line_changes) - { - auto file_name = new_file_path.empty() ? old_file_path : new_file_path; - auto it = file_changes.find(file_name); - if (file_changes.end() != it) - file_change_and_line_changes = &it->second; - } - - if (file_change_and_line_changes) - { - uint32_t old_lines = 1; - uint32_t new_lines = 1; - - assertChar('-', in); - readText(line_change.hunk_start_line_number_old, in); - if (checkChar(',', in)) - readText(old_lines, in); - - assertString(" +", in); - readText(line_change.hunk_start_line_number_new, in); - if (checkChar(',', in)) - readText(new_lines, in); - - if (line_change.hunk_start_line_number_new == 0) - line_change.hunk_start_line_number_new = 1; - - assertString(" @@", in); - if (checkChar(' ', in)) - readStringUntilNextLine(line_change.hunk_context, in); - else - assertChar('\n', in); - - line_change.hunk_lines_added = new_lines; - line_change.hunk_lines_deleted = old_lines; - - ++line_change.hunk_num; - line_change.line_number_old = line_change.hunk_start_line_number_old; - line_change.line_number_new = line_change.hunk_start_line_number_new; - - if (old_lines && new_lines) - { - ++commit.hunks_changed; - ++file_change_and_line_changes->file_change.hunks_changed; - } - else if (old_lines) - { - ++commit.hunks_removed; - ++file_change_and_line_changes->file_change.hunks_removed; - } - else if (new_lines) - { - ++commit.hunks_added; - ++file_change_and_line_changes->file_change.hunks_added; - } - } - } - else if (checkChar('-', in)) - { - if (checkString("-- ", in)) - { - if (checkString("a/", in)) - { - readStringUntilNextLine(old_file_path, in); - line_change = LineChange{}; - file_change_and_line_changes = nullptr; - } - else if (checkString("/dev/null", in)) - { - old_file_path.clear(); - assertChar('\n', in); - line_change = LineChange{}; - file_change_and_line_changes = nullptr; - } - else - skipUntilNextLine(in); /// Actually it can be the line in diff. Skip it for simplicity. 
- } - else - { - if (file_change_and_line_changes) - { - ++commit.lines_deleted; - ++file_change_and_line_changes->file_change.lines_deleted; - - line_change.sign = -1; - readStringUntilNextLine(line_change.line, in); - line_change.setLineInfo(line_change.line); - - file_change_and_line_changes->line_changes.push_back(line_change); - ++line_change.line_number_old; - } - } - } - else if (checkChar('+', in)) - { - if (checkString("++ ", in)) - { - if (checkString("b/", in)) - { - readStringUntilNextLine(new_file_path, in); - line_change = LineChange{}; - file_change_and_line_changes = nullptr; - } - else if (checkString("/dev/null", in)) - { - new_file_path.clear(); - assertChar('\n', in); - line_change = LineChange{}; - file_change_and_line_changes = nullptr; - } - else - skipUntilNextLine(in); /// Actually it can be the line in diff. Skip it for simplicity. - } - else - { - if (file_change_and_line_changes) - { - ++commit.lines_added; - ++file_change_and_line_changes->file_change.lines_added; - - line_change.sign = 1; - readStringUntilNextLine(line_change.line, in); - line_change.setLineInfo(line_change.line); - - file_change_and_line_changes->line_changes.push_back(line_change); - ++line_change.line_number_new; - } - } - } - else - { - skipUntilNextLine(in); - } - } - } - - if (options.diff_size_limit && commit_num != 0 && commit.lines_added + commit.lines_deleted > *options.diff_size_limit) - return; - - /// Calculate hash of diff and skip duplicates - if (options.skip_commits_with_duplicate_diffs) - { - SipHash hasher; - - for (auto & elem : file_changes) - { - hasher.update(elem.second.file_change.change_type); - hasher.update(elem.second.file_change.old_path.size()); - hasher.update(elem.second.file_change.old_path); - hasher.update(elem.second.file_change.path.size()); - hasher.update(elem.second.file_change.path); - - hasher.update(elem.second.line_changes.size()); - for (auto & line_change : elem.second.line_changes) - { - hasher.update(line_change.sign); - hasher.update(line_change.line_number_old); - hasher.update(line_change.line_number_new); - hasher.update(line_change.indent); - hasher.update(line_change.line.size()); - hasher.update(line_change.line); - } - } - - UInt128 hash_of_diff; - hasher.get128(hash_of_diff.low, hash_of_diff.high); - - if (!diff_hashes.insert(hash_of_diff).second) - return; - } - - /// Update snapshot and blame info - for (auto & elem : file_changes) { // std::cerr << elem.first << "\n"; @@ -928,47 +693,379 @@ void processCommit( } } } +} - /// Write the result - /// commits table +/** Deduplication of commits with identical diffs. 
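+ * Such duplicate diffs typically appear as a result of cherry-picks or merges after a rebase
+ * (this is what the "skip-commits-with-duplicate-diffs" option filters out).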
+ */ +using DiffHashes = std::unordered_set; + +UInt128 diffHash(const CommitDiff & file_changes) +{ + SipHash hasher; + + for (auto & elem : file_changes) { - auto & out = result.commits; + hasher.update(elem.second.file_change.change_type); + hasher.update(elem.second.file_change.old_path.size()); + hasher.update(elem.second.file_change.old_path); + hasher.update(elem.second.file_change.path.size()); + hasher.update(elem.second.file_change.path); - commit.writeTextWithoutNewline(out); - writeChar('\n', out); + hasher.update(elem.second.line_changes.size()); + for (auto & line_change : elem.second.line_changes) + { + hasher.update(line_change.sign); + hasher.update(line_change.line_number_old); + hasher.update(line_change.line_number_new); + hasher.update(line_change.indent); + hasher.update(line_change.line.size()); + hasher.update(line_change.line); + } } - for (const auto & elem : file_changes) + UInt128 hash_of_diff; + hasher.get128(hash_of_diff.low, hash_of_diff.high); + + return hash_of_diff; +} + + +/** File changes in form + * :100644 100644 b90fe6bb94 3ffe4c380f M src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp + * :100644 100644 828dedf6b5 828dedf6b5 R100 dbms/src/Functions/GeoUtils.h dbms/src/Functions/PolygonUtils.h + * according to the output of 'git show --raw' + */ +void processFileChanges( + ReadBuffer & in, + const Options & options, + Commit & commit, + CommitDiff & file_changes) +{ + while (checkChar(':', in)) { - const FileChange & file_change = elem.second.file_change; + FileChange file_change; - /// file_changes table + /// We don't care about file mode and content hashes. + for (size_t i = 0; i < 4; ++i) { - auto & out = result.file_changes; - - file_change.writeTextWithoutNewline(out); - writeChar('\t', out); - commit.writeTextWithoutNewline(out); - writeChar('\n', out); + skipUntilWhitespace(in); + skipWhitespaceIfAny(in); } - /// line_changes table - for (const auto & line_change : elem.second.line_changes) - { - auto & out = result.line_changes; + char change_type; + readChar(change_type, in); - line_change.writeTextWithoutNewline(out); - writeChar('\t', out); - file_change.writeTextWithoutNewline(out); - writeChar('\t', out); - commit.writeTextWithoutNewline(out); - writeChar('\n', out); + /// For rename and copy there is a number called "score". We ignore it. + int score; + + switch (change_type) + { + case 'A': + file_change.change_type = FileChangeType::Add; + ++commit.files_added; + break; + case 'D': + file_change.change_type = FileChangeType::Delete; + ++commit.files_deleted; + break; + case 'M': + file_change.change_type = FileChangeType::Modify; + ++commit.files_modified; + break; + case 'R': + file_change.change_type = FileChangeType::Rename; + ++commit.files_renamed; + readText(score, in); + break; + case 'C': + file_change.change_type = FileChangeType::Copy; + readText(score, in); + break; + case 'T': + file_change.change_type = FileChangeType::Type; + break; + default: + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected file change type: {}", change_type); + } + + skipWhitespaceIfAny(in); + + if (change_type == 'R' || change_type == 'C') + { + readText(file_change.old_path, in); + skipWhitespaceIfAny(in); + readText(file_change.path, in); + } + else + { + readText(file_change.path, in); + } + + file_change.file_extension = std::filesystem::path(file_change.path).extension(); + /// It gives us extension in form of '.cpp'. There is a reason for it but we remove initial dot for simplicity. 
+ if (!file_change.file_extension.empty() && file_change.file_extension.front() == '.') + file_change.file_extension = file_change.file_extension.substr(1, std::string::npos); + + assertChar('\n', in); + + if (!(options.skip_paths && re2_st::RE2::PartialMatch(file_change.path, *options.skip_paths))) + { + file_changes.emplace( + file_change.path, + FileDiff(file_change)); } } } +/** Process the list of diffs for every file from the result of "git show". + * Caveats: + * - changes in binary files can be ignored; + * - if a line content begins with '+' or '-' it will be skipped + * it means that if you store diffs in repository and "git show" will display diff-of-diff for you, + * it won't be processed correctly; + * - we expect some specific format of the diff; but it may actually depend on git config; + * - non-ASCII file names are not processed correctly (they will not be found and will be ignored). + */ +void processDiffs( + ReadBuffer & in, + std::optional size_limit, + Commit & commit, + CommitDiff & file_changes) +{ + std::string old_file_path; + std::string new_file_path; + FileDiff * file_change_and_line_changes = nullptr; + LineChange line_change; + + /// Diffs for every file in form of + /// --- a/src/Storages/StorageReplicatedMergeTree.cpp + /// +++ b/src/Storages/StorageReplicatedMergeTree.cpp + /// @@ -1387,2 +1387 @@ bool StorageReplicatedMergeTree::tryExecuteMerge(const LogEntry & entry) + /// - table_lock, entry.create_time, reserved_space, entry.deduplicate, + /// - entry.force_ttl); + /// + table_lock, entry.create_time, reserved_space, entry.deduplicate); + + size_t diff_size = 0; + while (!in.eof()) + { + if (checkString("@@ ", in)) + { + if (!file_change_and_line_changes) + { + auto file_name = new_file_path.empty() ? old_file_path : new_file_path; + auto it = file_changes.find(file_name); + if (file_changes.end() != it) + file_change_and_line_changes = &it->second; + } + + if (file_change_and_line_changes) + { + uint32_t old_lines = 1; + uint32_t new_lines = 1; + + assertChar('-', in); + readText(line_change.hunk_start_line_number_old, in); + if (checkChar(',', in)) + readText(old_lines, in); + + assertString(" +", in); + readText(line_change.hunk_start_line_number_new, in); + if (checkChar(',', in)) + readText(new_lines, in); + + /// This is needed to simplify the logic of updating snapshot: + /// When all lines are removed we can treat it as repeated removal of line with number 1. 
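+                /// For example, removing lines from the very beginning of a file produces a hunk header like '@@ -1,3 +0,0 @@'.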
+ if (line_change.hunk_start_line_number_new == 0) + line_change.hunk_start_line_number_new = 1; + + assertString(" @@", in); + if (checkChar(' ', in)) + readStringUntilNextLine(line_change.hunk_context, in); + else + assertChar('\n', in); + + line_change.hunk_lines_added = new_lines; + line_change.hunk_lines_deleted = old_lines; + + ++line_change.hunk_num; + line_change.line_number_old = line_change.hunk_start_line_number_old; + line_change.line_number_new = line_change.hunk_start_line_number_new; + + if (old_lines && new_lines) + { + ++commit.hunks_changed; + ++file_change_and_line_changes->file_change.hunks_changed; + } + else if (old_lines) + { + ++commit.hunks_removed; + ++file_change_and_line_changes->file_change.hunks_removed; + } + else if (new_lines) + { + ++commit.hunks_added; + ++file_change_and_line_changes->file_change.hunks_added; + } + } + } + else if (checkChar('-', in)) + { + if (checkString("-- ", in)) + { + if (checkString("a/", in)) + { + readStringUntilNextLine(old_file_path, in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else if (checkString("/dev/null", in)) + { + old_file_path.clear(); + assertChar('\n', in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else + skipUntilNextLine(in); /// Actually it can be the line in diff. Skip it for simplicity. + } + else + { + ++diff_size; + if (file_change_and_line_changes) + { + ++commit.lines_deleted; + ++file_change_and_line_changes->file_change.lines_deleted; + + line_change.sign = -1; + readStringUntilNextLine(line_change.line, in); + line_change.setLineInfo(line_change.line); + + file_change_and_line_changes->line_changes.push_back(line_change); + ++line_change.line_number_old; + } + } + } + else if (checkChar('+', in)) + { + if (checkString("++ ", in)) + { + if (checkString("b/", in)) + { + readStringUntilNextLine(new_file_path, in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else if (checkString("/dev/null", in)) + { + new_file_path.clear(); + assertChar('\n', in); + line_change = LineChange{}; + file_change_and_line_changes = nullptr; + } + else + skipUntilNextLine(in); /// Actually it can be the line in diff. Skip it for simplicity. + } + else + { + ++diff_size; + if (file_change_and_line_changes) + { + ++commit.lines_added; + ++file_change_and_line_changes->file_change.lines_added; + + line_change.sign = 1; + readStringUntilNextLine(line_change.line, in); + line_change.setLineInfo(line_change.line); + + file_change_and_line_changes->line_changes.push_back(line_change); + ++line_change.line_number_new; + } + } + } + else + { + /// Unknown lines are ignored. + skipUntilNextLine(in); + } + + if (size_limit && diff_size > *size_limit) + return; + } +} + + +/** Process the "git show" result for a single commit. Append the result to tables. 
+ */ +void processCommit( + ReadBuffer & in, + const Options & options, + size_t commit_num, + size_t total_commits, + std::string hash, + Snapshot & snapshot, + DiffHashes & diff_hashes, + ResultWriter & result) +{ + Commit commit; + commit.hash = hash; + + time_t commit_time; + readText(commit_time, in); + commit.time = commit_time; + assertChar('\0', in); + readNullTerminated(commit.author, in); + std::string parent_hash; + readNullTerminated(parent_hash, in); + readNullTerminated(commit.message, in); + + if (options.skip_commits_with_messages && re2_st::RE2::PartialMatch(commit.message, *options.skip_commits_with_messages)) + return; + + std::string message_to_print = commit.message; + std::replace_if(message_to_print.begin(), message_to_print.end(), [](char c){ return std::iscntrl(c); }, ' '); + + std::cerr << fmt::format("{}% {} {} {}\n", + commit_num * 100 / total_commits, toString(commit.time), hash, message_to_print); + + if (options.skip_commits_without_parents && commit_num != 0 && parent_hash.empty()) + { + std::cerr << "Warning: skipping commit without parents\n"; + return; + } + + if (!in.eof()) + assertChar('\n', in); + + CommitDiff file_changes; + processFileChanges(in, options, commit, file_changes); + + if (!in.eof()) + { + assertChar('\n', in); + processDiffs(in, commit_num != 0 ? options.diff_size_limit : std::nullopt, commit, file_changes); + } + + /// Skip commits with too large diffs. + if (options.diff_size_limit && commit_num != 0 && commit.lines_added + commit.lines_deleted > *options.diff_size_limit) + return; + + /// Calculate hash of diff and skip duplicates + if (options.skip_commits_with_duplicate_diffs && !diff_hashes.insert(diffHash(file_changes)).second) + return; + + /// Update snapshot and blame info + updateSnapshot(snapshot, commit, file_changes); + + /// Write the result + result.appendCommit(commit, file_changes); +} + + +/** Runs child process and allows to read the result. + * Multiple processes can be run for parallel processing. + */ auto gitShow(const std::string & hash) { std::string command = fmt::format( @@ -979,9 +1076,11 @@ auto gitShow(const std::string & hash) } +/** Obtain the list of commits and process them. + */ void processLog(const Options & options) { - Result result; + ResultWriter result; std::string command = "git log --reverse --no-merges --pretty=%H"; fmt::print("{}\n", command); @@ -1019,7 +1118,7 @@ void processLog(const Options & options) for (size_t i = 0; i < num_commits; ++i) { - processCommit(show_commands[i % num_threads], options, i, num_commits, hashes[i], snapshot, diff_hashes, result); + processCommit(show_commands[i % num_threads]->out, options, i, num_commits, hashes[i], snapshot, diff_hashes, result); if (!options.stop_after_commit.empty() && hashes[i] == options.stop_after_commit) break; From 94d49e4197b443a6bced0ac0d137ad646c1c1946 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 03:18:15 +0300 Subject: [PATCH 037/341] Minor modifications --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 6e43853d6ba..2add6813008 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -120,7 +120,9 @@ CREATE TABLE git.line_changes commit_hunks_changed UInt32 ) ENGINE = MergeTree ORDER BY time; -Insert the data with the following commands: +Run the tool. 
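+For example, a minimal run from inside the repository looks like this (an illustrative
+invocation; the Example in the --help output shows a fuller command with skip filters):
+
+./git-to-clickhouse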
+ +Then insert the data with the following commands: clickhouse-client --query "INSERT INTO git.commits FORMAT TSV" < commits.tsv clickhouse-client --query "INSERT INTO git.file_changes FORMAT TSV" < file_changes.tsv From 47ca6211604c6fcb7b2c4e137d739ebff88da975 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 03:25:06 +0300 Subject: [PATCH 038/341] Minor modifications --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 2add6813008..875da3ba0ac 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -993,7 +993,12 @@ void processDiffs( } if (size_limit && diff_size > *size_limit) + { + /// Drain to avoid "broken pipe" error in child process. + while (!in.eof()) + in.ignore(in.available()); return; + } } } From 6e0afbecf4fd0ccd04e9dbb82bff6a507545e8d1 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 04:02:35 +0300 Subject: [PATCH 039/341] Minor modifications --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 17 ++++++++++++++--- 1 file changed, 14 insertions(+), 3 deletions(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 875da3ba0ac..b5488b0d69a 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -138,6 +138,7 @@ namespace DB namespace ErrorCodes { extern const int INCORRECT_DATA; + extern const int CHILD_WAS_NOT_EXITED_NORMALLY; } @@ -994,9 +995,6 @@ void processDiffs( if (size_limit && diff_size > *size_limit) { - /// Drain to avoid "broken pipe" error in child process. - while (!in.eof()) - in.ignore(in.available()); return; } } @@ -1127,6 +1125,19 @@ void processLog(const Options & options) { processCommit(show_commands[i % num_threads]->out, options, i, num_commits, hashes[i], snapshot, diff_hashes, result); + try + { + show_commands[i % num_threads]->wait(); + } + catch (const Exception & e) + { + /// For broken pipe when we stopped reading prematurally. + if (e.code() == ErrorCodes::CHILD_WAS_NOT_EXITED_NORMALLY) + std::cerr << getCurrentExceptionMessage(false) << "\n"; + else + throw; + } + if (!options.stop_after_commit.empty() && hashes[i] == options.stop_after_commit) break; From 69ce9e1f7020df985d7ea6ee450bf0d4b3438a0d Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 05:36:54 +0300 Subject: [PATCH 040/341] More documentation --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 45 +++++++++++++++++++ 1 file changed, 45 insertions(+) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index b5488b0d69a..d3b6f77d3d7 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -27,6 +27,51 @@ static constexpr auto documentation = R"( +A tool to extract information from Git repository for analytics. + +It dumps the data for the following tables: +- commits - commits with statistics; +- file_changes - files changed in every commit with the info about the change and statistics; +- line_changes - every changed line in every changed file in every commit with full info about the line and the information about previous change of this line. + +The largest and the most important table is "line_changes". 
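+
+For a first taste of it, a query along these lines (an illustrative sketch; column names are
+the ones defined by the CREATE TABLE statements above) lists who added the most lines:
+
+SELECT author, count() AS lines_added
+FROM git.line_changes
+WHERE sign = 1
+GROUP BY author
+ORDER BY lines_added DESC
+LIMIT 10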
+
+The data allows answering questions like:
+- list files with the maximum number of authors;
+- show me the oldest lines of code in the repository;
+- show me the files with the longest history;
+- list favorite files for an author;
+- list the largest files with the lowest number of authors;
+- on which weekday the code has the highest chance to stay in the repository;
+- the distribution of code age across the repository;
+- files sorted by average code age;
+- quickly show a file with rough blame info;
+- the distribution of commits and lines of code by time, by weekday, by author, and for specific subdirectories;
+- show the history of every subdirectory, file, or line of a file: the number of changes (lines and commits) across time, and how the number of contributors changed across time;
+- list files with the most modifications;
+- list files that were rewritten the most times or by the most authors;
+- what is the percentage of code removed by other authors, across authors;
+- the matrix of authors that shows which authors tend to rewrite another author's code;
+- what is the worst time to write code, in the sense that the code has the highest chance to be rewritten;
+- the average time before code is rewritten and the median (the half-life of code decay);
+- how the comments/code percentage changes over time, by author, and by location;
+- who tends to write more tests / C++ code / comments.
+
+The data is intended for analytical purposes. It can be imprecise for many reasons, but it should be good enough for its purpose.
+
+The data is not intended to provide any conclusions for managers; it is especially counter-indicative for any kind of "performance review". Instead, you can spend multiple days looking at various interesting statistics.
+
+Run this tool inside your git repository. It will create .tsv files that can be loaded into ClickHouse (or into another DBMS if you dare).
+
+The tool can process large enough repositories in a reasonable time.
+It has been tested on: +- ClickHouse: 31 seconds; 3 million rows; +- LLVM: 8 minues; 62 million rows; +- Linux - 12 minutes; 85 million rows; +- Chromium - 67 minutes; 343 million rows; +(the numbers as of Sep 2020) + + Prepare the database by executing the following queries: DROP DATABASE IF EXISTS git; From 1dc48f66710c5a93e5376320ea7cf3c4a18046d5 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 05:39:08 +0300 Subject: [PATCH 041/341] Better help --- utils/git-to-clickhouse/git-to-clickhouse.cpp | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index d3b6f77d3d7..6ef82ac3b6b 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -13,6 +13,7 @@ #include +#include #include #include #include @@ -1199,7 +1200,7 @@ try { using namespace DB; - po::options_description desc("Allowed options"); + po::options_description desc("Allowed options", getTerminalWidth()); desc.add_options() ("help,h", "produce help message") ("skip-commits-without-parents", po::value()->default_value(true), From 1400bdbf83c9ebf6e63eeda73966b7e7c0210d80 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 06:11:35 +0300 Subject: [PATCH 042/341] Fix unit tests --- src/Common/ShellCommand.cpp | 23 +++++++++++++++---- utils/git-to-clickhouse/git-to-clickhouse.cpp | 13 ----------- 2 files changed, 18 insertions(+), 18 deletions(-) diff --git a/src/Common/ShellCommand.cpp b/src/Common/ShellCommand.cpp index 127f95fef06..bbb8801f190 100644 --- a/src/Common/ShellCommand.cpp +++ b/src/Common/ShellCommand.cpp @@ -57,7 +57,16 @@ ShellCommand::~ShellCommand() LOG_WARNING(getLogger(), "Cannot kill shell command pid {} errno '{}'", pid, errnoToString(retcode)); } else if (!wait_called) - tryWait(); + { + try + { + tryWait(); + } + catch (...) + { + tryLogCurrentException(getLogger()); + } + } } void ShellCommand::logCommand(const char * filename, char * const argv[]) @@ -74,7 +83,8 @@ void ShellCommand::logCommand(const char * filename, char * const argv[]) LOG_TRACE(ShellCommand::getLogger(), "Will start shell command '{}' with arguments {}", filename, args.str()); } -std::unique_ptr ShellCommand::executeImpl(const char * filename, char * const argv[], bool pipe_stdin_only, bool terminate_in_destructor) +std::unique_ptr ShellCommand::executeImpl( + const char * filename, char * const argv[], bool pipe_stdin_only, bool terminate_in_destructor) { logCommand(filename, argv); @@ -130,7 +140,8 @@ std::unique_ptr ShellCommand::executeImpl(const char * filename, c _exit(int(ReturnCodes::CANNOT_EXEC)); } - std::unique_ptr res(new ShellCommand(pid, pipe_stdin.fds_rw[1], pipe_stdout.fds_rw[0], pipe_stderr.fds_rw[0], terminate_in_destructor)); + std::unique_ptr res(new ShellCommand( + pid, pipe_stdin.fds_rw[1], pipe_stdout.fds_rw[0], pipe_stderr.fds_rw[0], terminate_in_destructor)); LOG_TRACE(getLogger(), "Started shell command '{}' with pid {}", filename, pid); @@ -143,7 +154,8 @@ std::unique_ptr ShellCommand::executeImpl(const char * filename, c } -std::unique_ptr ShellCommand::execute(const std::string & command, bool pipe_stdin_only, bool terminate_in_destructor) +std::unique_ptr ShellCommand::execute( + const std::string & command, bool pipe_stdin_only, bool terminate_in_destructor) { /// Arguments in non-constant chunks of memory (as required for `execv`). 
/// Moreover, their copying must be done before calling `vfork`, so after `vfork` do a minimum of things. @@ -157,7 +169,8 @@ std::unique_ptr ShellCommand::execute(const std::string & command, } -std::unique_ptr ShellCommand::executeDirect(const std::string & path, const std::vector & arguments, bool terminate_in_destructor) +std::unique_ptr ShellCommand::executeDirect( + const std::string & path, const std::vector & arguments, bool terminate_in_destructor) { size_t argv_sum_size = path.size() + 1; for (const auto & arg : arguments) diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/utils/git-to-clickhouse/git-to-clickhouse.cpp index 6ef82ac3b6b..a081efa3f47 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/utils/git-to-clickhouse/git-to-clickhouse.cpp @@ -1171,19 +1171,6 @@ void processLog(const Options & options) { processCommit(show_commands[i % num_threads]->out, options, i, num_commits, hashes[i], snapshot, diff_hashes, result); - try - { - show_commands[i % num_threads]->wait(); - } - catch (const Exception & e) - { - /// For broken pipe when we stopped reading prematurally. - if (e.code() == ErrorCodes::CHILD_WAS_NOT_EXITED_NORMALLY) - std::cerr << getCurrentExceptionMessage(false) << "\n"; - else - throw; - } - if (!options.stop_after_commit.empty() && hashes[i] == options.stop_after_commit) break; From d18e7adbc03e4e7d7ee268e8f90a14e73be7b021 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 06:22:47 +0300 Subject: [PATCH 043/341] Add git-import as a tool --- programs/CMakeLists.txt | 18 ++++++++++++++---- programs/config_tools.h.in | 1 + programs/git-import/CMakeLists.txt | 10 ++++++++++ programs/git-import/clickhouse-git-import.cpp | 2 ++ .../git-import/git-import.cpp | 4 ++-- programs/install/Install.cpp | 1 + programs/main.cpp | 6 ++++++ utils/CMakeLists.txt | 1 - utils/git-to-clickhouse/CMakeLists.txt | 2 -- 9 files changed, 36 insertions(+), 9 deletions(-) create mode 100644 programs/git-import/CMakeLists.txt create mode 100644 programs/git-import/clickhouse-git-import.cpp rename utils/git-to-clickhouse/git-to-clickhouse.cpp => programs/git-import/git-import.cpp (99%) delete mode 100644 utils/git-to-clickhouse/CMakeLists.txt diff --git a/programs/CMakeLists.txt b/programs/CMakeLists.txt index 89220251cda..ae4a72ef62a 100644 --- a/programs/CMakeLists.txt +++ b/programs/CMakeLists.txt @@ -16,6 +16,7 @@ option (ENABLE_CLICKHOUSE_COMPRESSOR "Enable clickhouse-compressor" ${ENABLE_CLI option (ENABLE_CLICKHOUSE_COPIER "Enable clickhouse-copier" ${ENABLE_CLICKHOUSE_ALL}) option (ENABLE_CLICKHOUSE_FORMAT "Enable clickhouse-format" ${ENABLE_CLICKHOUSE_ALL}) option (ENABLE_CLICKHOUSE_OBFUSCATOR "Enable clickhouse-obfuscator" ${ENABLE_CLICKHOUSE_ALL}) +option (ENABLE_CLICKHOUSE_GIT_IMPORT "Enable clickhouse-git-import" ${ENABLE_CLICKHOUSE_ALL}) option (ENABLE_CLICKHOUSE_ODBC_BRIDGE "Enable clickhouse-odbc-bridge" ${ENABLE_CLICKHOUSE_ALL}) if (CLICKHOUSE_SPLIT_BINARY) @@ -91,21 +92,22 @@ add_subdirectory (copier) add_subdirectory (format) add_subdirectory (obfuscator) add_subdirectory (install) +add_subdirectory (git-import) if (ENABLE_CLICKHOUSE_ODBC_BRIDGE) add_subdirectory (odbc-bridge) endif () if (CLICKHOUSE_ONE_SHARED) - add_library(clickhouse-lib SHARED ${CLICKHOUSE_SERVER_SOURCES} ${CLICKHOUSE_CLIENT_SOURCES} ${CLICKHOUSE_LOCAL_SOURCES} ${CLICKHOUSE_BENCHMARK_SOURCES} ${CLICKHOUSE_COPIER_SOURCES} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_SOURCES} ${CLICKHOUSE_COMPRESSOR_SOURCES} ${CLICKHOUSE_FORMAT_SOURCES} ${CLICKHOUSE_OBFUSCATOR_SOURCES} 
${CLICKHOUSE_ODBC_BRIDGE_SOURCES}) - target_link_libraries(clickhouse-lib ${CLICKHOUSE_SERVER_LINK} ${CLICKHOUSE_CLIENT_LINK} ${CLICKHOUSE_LOCAL_LINK} ${CLICKHOUSE_BENCHMARK_LINK} ${CLICKHOUSE_COPIER_LINK} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_LINK} ${CLICKHOUSE_COMPRESSOR_LINK} ${CLICKHOUSE_FORMAT_LINK} ${CLICKHOUSE_OBFUSCATOR_LINK} ${CLICKHOUSE_ODBC_BRIDGE_LINK}) - target_include_directories(clickhouse-lib ${CLICKHOUSE_SERVER_INCLUDE} ${CLICKHOUSE_CLIENT_INCLUDE} ${CLICKHOUSE_LOCAL_INCLUDE} ${CLICKHOUSE_BENCHMARK_INCLUDE} ${CLICKHOUSE_COPIER_INCLUDE} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_INCLUDE} ${CLICKHOUSE_COMPRESSOR_INCLUDE} ${CLICKHOUSE_FORMAT_INCLUDE} ${CLICKHOUSE_OBFUSCATOR_INCLUDE} ${CLICKHOUSE_ODBC_BRIDGE_INCLUDE}) + add_library(clickhouse-lib SHARED ${CLICKHOUSE_SERVER_SOURCES} ${CLICKHOUSE_CLIENT_SOURCES} ${CLICKHOUSE_LOCAL_SOURCES} ${CLICKHOUSE_BENCHMARK_SOURCES} ${CLICKHOUSE_COPIER_SOURCES} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_SOURCES} ${CLICKHOUSE_COMPRESSOR_SOURCES} ${CLICKHOUSE_FORMAT_SOURCES} ${CLICKHOUSE_OBFUSCATOR_SOURCES} ${CLICKHOUSE_GIT_IMPORT_SOURCES} ${CLICKHOUSE_ODBC_BRIDGE_SOURCES}) + target_link_libraries(clickhouse-lib ${CLICKHOUSE_SERVER_LINK} ${CLICKHOUSE_CLIENT_LINK} ${CLICKHOUSE_LOCAL_LINK} ${CLICKHOUSE_BENCHMARK_LINK} ${CLICKHOUSE_COPIER_LINK} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_LINK} ${CLICKHOUSE_COMPRESSOR_LINK} ${CLICKHOUSE_FORMAT_LINK} ${CLICKHOUSE_OBFUSCATOR_LINK} ${CLICKHOUSE_GIT_IMPORT_LINK} ${CLICKHOUSE_ODBC_BRIDGE_LINK}) + target_include_directories(clickhouse-lib ${CLICKHOUSE_SERVER_INCLUDE} ${CLICKHOUSE_CLIENT_INCLUDE} ${CLICKHOUSE_LOCAL_INCLUDE} ${CLICKHOUSE_BENCHMARK_INCLUDE} ${CLICKHOUSE_COPIER_INCLUDE} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_INCLUDE} ${CLICKHOUSE_COMPRESSOR_INCLUDE} ${CLICKHOUSE_FORMAT_INCLUDE} ${CLICKHOUSE_OBFUSCATOR_INCLUDE} ${CLICKHOUSE_GIT_IMPORT_INCLUDE} ${CLICKHOUSE_ODBC_BRIDGE_INCLUDE}) set_target_properties(clickhouse-lib PROPERTIES SOVERSION ${VERSION_MAJOR}.${VERSION_MINOR} VERSION ${VERSION_SO} OUTPUT_NAME clickhouse DEBUG_POSTFIX "") install (TARGETS clickhouse-lib LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} COMPONENT clickhouse) endif() if (CLICKHOUSE_SPLIT_BINARY) - set (CLICKHOUSE_ALL_TARGETS clickhouse-server clickhouse-client clickhouse-local clickhouse-benchmark clickhouse-extract-from-config clickhouse-compressor clickhouse-format clickhouse-obfuscator clickhouse-copier) + set (CLICKHOUSE_ALL_TARGETS clickhouse-server clickhouse-client clickhouse-local clickhouse-benchmark clickhouse-extract-from-config clickhouse-compressor clickhouse-format clickhouse-obfuscator clickhouse-git-import clickhouse-copier) if (ENABLE_CLICKHOUSE_ODBC_BRIDGE) list (APPEND CLICKHOUSE_ALL_TARGETS clickhouse-odbc-bridge) @@ -149,6 +151,9 @@ else () if (ENABLE_CLICKHOUSE_OBFUSCATOR) clickhouse_target_link_split_lib(clickhouse obfuscator) endif () + if (ENABLE_CLICKHOUSE_GIT_IMPORT) + clickhouse_target_link_split_lib(clickhouse git-import) + endif () if (ENABLE_CLICKHOUSE_INSTALL) clickhouse_target_link_split_lib(clickhouse install) endif () @@ -199,6 +204,11 @@ else () install (FILES ${CMAKE_CURRENT_BINARY_DIR}/clickhouse-obfuscator DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse) list(APPEND CLICKHOUSE_BUNDLE clickhouse-obfuscator) endif () + if (ENABLE_CLICKHOUSE_GIT_IMPORT) + add_custom_target (clickhouse-git-import ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse clickhouse-git-import DEPENDS clickhouse) + install (FILES ${CMAKE_CURRENT_BINARY_DIR}/clickhouse-git-import DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse) + 
list(APPEND CLICKHOUSE_BUNDLE clickhouse-git-import) + endif () if(ENABLE_CLICKHOUSE_ODBC_BRIDGE) list(APPEND CLICKHOUSE_BUNDLE clickhouse-odbc-bridge) endif() diff --git a/programs/config_tools.h.in b/programs/config_tools.h.in index 11386aca60e..7cb5a6d883a 100644 --- a/programs/config_tools.h.in +++ b/programs/config_tools.h.in @@ -12,5 +12,6 @@ #cmakedefine01 ENABLE_CLICKHOUSE_COMPRESSOR #cmakedefine01 ENABLE_CLICKHOUSE_FORMAT #cmakedefine01 ENABLE_CLICKHOUSE_OBFUSCATOR +#cmakedefine01 ENABLE_CLICKHOUSE_GIT_IMPORT #cmakedefine01 ENABLE_CLICKHOUSE_INSTALL #cmakedefine01 ENABLE_CLICKHOUSE_ODBC_BRIDGE diff --git a/programs/git-import/CMakeLists.txt b/programs/git-import/CMakeLists.txt new file mode 100644 index 00000000000..279bb35a272 --- /dev/null +++ b/programs/git-import/CMakeLists.txt @@ -0,0 +1,10 @@ +set (CLICKHOUSE_GIT_IMPORT_SOURCES git-import.cpp) + +set (CLICKHOUSE_GIT_IMPORT_LINK + PRIVATE + boost::program_options + dbms +) + +clickhouse_program_add(git-import) + diff --git a/programs/git-import/clickhouse-git-import.cpp b/programs/git-import/clickhouse-git-import.cpp new file mode 100644 index 00000000000..cfa06306604 --- /dev/null +++ b/programs/git-import/clickhouse-git-import.cpp @@ -0,0 +1,2 @@ +int mainEntryClickHouseGitImport(int argc, char ** argv); +int main(int argc_, char ** argv_) { return mainEntryClickHouseGitImport(argc_, argv_); } diff --git a/utils/git-to-clickhouse/git-to-clickhouse.cpp b/programs/git-import/git-import.cpp similarity index 99% rename from utils/git-to-clickhouse/git-to-clickhouse.cpp rename to programs/git-import/git-import.cpp index a081efa3f47..f1ed4d28c6e 100644 --- a/utils/git-to-clickhouse/git-to-clickhouse.cpp +++ b/programs/git-import/git-import.cpp @@ -1182,7 +1182,7 @@ void processLog(const Options & options) } -int main(int argc, char ** argv) +int mainEntryClickHouseGitImport(int argc, char ** argv) try { using namespace DB; @@ -1219,7 +1219,7 @@ try << "Usage: " << argv[0] << '\n' << desc << '\n' << "\nExample:\n" - << "\n./git-to-clickhouse --skip-paths 'generated\\.cpp|^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/' --skip-commits-with-messages '^Merge branch '\n"; + << "\nclickhouse git-import --skip-paths 'generated\\.cpp|^(contrib|docs?|website|libs/(libcityhash|liblz4|libdivide|libvectorclass|libdouble-conversion|libcpuid|libzstd|libfarmhash|libmetrohash|libpoco|libwidechar_width))/' --skip-commits-with-messages '^Merge branch '\n"; return 1; } diff --git a/programs/install/Install.cpp b/programs/install/Install.cpp index 7b7ab149447..bd60fbb63ba 100644 --- a/programs/install/Install.cpp +++ b/programs/install/Install.cpp @@ -205,6 +205,7 @@ int mainEntryClickHouseInstall(int argc, char ** argv) "clickhouse-benchmark", "clickhouse-copier", "clickhouse-obfuscator", + "clickhouse-git-import", "clickhouse-compressor", "clickhouse-format", "clickhouse-extract-from-config" diff --git a/programs/main.cpp b/programs/main.cpp index 3df5f9f683b..b91bd732f21 100644 --- a/programs/main.cpp +++ b/programs/main.cpp @@ -46,6 +46,9 @@ int mainEntryClickHouseClusterCopier(int argc, char ** argv); #if ENABLE_CLICKHOUSE_OBFUSCATOR int mainEntryClickHouseObfuscator(int argc, char ** argv); #endif +#if ENABLE_CLICKHOUSE_GIT_IMPORT +int mainEntryClickHouseGitImport(int argc, char ** argv); +#endif #if ENABLE_CLICKHOUSE_INSTALL int mainEntryClickHouseInstall(int argc, char ** argv); int mainEntryClickHouseStart(int argc, char ** 
argv); @@ -91,6 +94,9 @@ std::pair clickhouse_applications[] = #if ENABLE_CLICKHOUSE_OBFUSCATOR {"obfuscator", mainEntryClickHouseObfuscator}, #endif +#if ENABLE_CLICKHOUSE_GIT_IMPORT + {"git-import", mainEntryClickHouseGitImport}, +#endif #if ENABLE_CLICKHOUSE_INSTALL {"install", mainEntryClickHouseInstall}, {"start", mainEntryClickHouseStart}, diff --git a/utils/CMakeLists.txt b/utils/CMakeLists.txt index 93490fba565..b4408a298c3 100644 --- a/utils/CMakeLists.txt +++ b/utils/CMakeLists.txt @@ -30,7 +30,6 @@ if (NOT DEFINED ENABLE_UTILS OR ENABLE_UTILS) add_subdirectory (checksum-for-compressed-block) add_subdirectory (db-generator) add_subdirectory (wal-dump) - add_subdirectory (git-to-clickhouse) endif () if (ENABLE_CODE_QUALITY) diff --git a/utils/git-to-clickhouse/CMakeLists.txt b/utils/git-to-clickhouse/CMakeLists.txt deleted file mode 100644 index 0e46b68d471..00000000000 --- a/utils/git-to-clickhouse/CMakeLists.txt +++ /dev/null @@ -1,2 +0,0 @@ -add_executable (git-to-clickhouse git-to-clickhouse.cpp) -target_link_libraries(git-to-clickhouse PRIVATE dbms boost::program_options) From ee54971c3d26ca1219da4909bd30f44bee77fd97 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 07:11:03 +0300 Subject: [PATCH 044/341] Fix build --- programs/git-import/git-import.cpp | 13 +++++++------ 1 file changed, 7 insertions(+), 6 deletions(-) diff --git a/programs/git-import/git-import.cpp b/programs/git-import/git-import.cpp index f1ed4d28c6e..d314969a1a8 100644 --- a/programs/git-import/git-import.cpp +++ b/programs/git-import/git-import.cpp @@ -184,7 +184,6 @@ namespace DB namespace ErrorCodes { extern const int INCORRECT_DATA; - extern const int CHILD_WAS_NOT_EXITED_NORMALLY; } @@ -419,7 +418,7 @@ using LineChanges = std::vector; struct FileDiff { - FileDiff(FileChange file_change_) : file_change(file_change_) {} + explicit FileDiff(FileChange file_change_) : file_change(file_change_) {} FileChange file_change; LineChanges line_changes; @@ -546,7 +545,7 @@ struct Options std::optional diff_size_limit; std::string stop_after_commit; - Options(const po::variables_map & options) + explicit Options(const po::variables_map & options) { skip_commits_without_parents = options["skip-commits-without-parents"].as(); skip_commits_with_duplicate_diffs = options["skip-commits-with-duplicate-diffs"].as(); @@ -753,7 +752,7 @@ UInt128 diffHash(const CommitDiff & file_changes) { SipHash hasher; - for (auto & elem : file_changes) + for (const auto & elem : file_changes) { hasher.update(elem.second.file_change.change_type); hasher.update(elem.second.file_change.old_path.size()); @@ -762,7 +761,7 @@ UInt128 diffHash(const CommitDiff & file_changes) hasher.update(elem.second.file_change.path); hasher.update(elem.second.line_changes.size()); - for (auto & line_change : elem.second.line_changes) + for (const auto & line_change : elem.second.line_changes) { hasher.update(line_change.sign); hasher.update(line_change.line_number_old); @@ -1159,6 +1158,8 @@ void processLog(const Options & options) /// Will run multiple processes in parallel size_t num_threads = options.threads; + if (num_threads == 0) + throw Exception("num-threads cannot be zero", ErrorCodes::INCORRECT_DATA); std::vector> show_commands(num_threads); for (size_t i = 0; i < num_commits && i < num_threads; ++i) @@ -1223,7 +1224,7 @@ try return 1; } - processLog(options); + processLog(Options(options)); return 0; } catch (...) 
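For context on how the new tool becomes reachable both as `clickhouse-git-import` and as `clickhouse git-import`: the combined binary keeps a table of tool names mapped to `mainEntryClickHouse*` functions and dispatches either on the executable (symlink) name or on the first argument. The standalone C++ sketch below illustrates only that dispatch idea; it is not the actual programs/main.cpp, and the entry-point bodies and tool list are placeholders.

#include <iostream>
#include <string>
#include <utility>
#include <vector>

/// Placeholder entry points; the real ones live in the per-tool sources.
int mainEntryGitImport(int, char **) { std::cout << "git-import tool\n"; return 0; }
int mainEntryObfuscator(int, char **) { std::cout << "obfuscator tool\n"; return 0; }

int main(int argc, char ** argv)
{
    /// Tool name -> entry point, similar in spirit to the clickhouse_applications[] table.
    const std::vector<std::pair<std::string, int (*)(int, char **)>> apps =
    {
        {"git-import", mainEntryGitImport},
        {"obfuscator", mainEntryObfuscator},
    };

    /// 1. Dispatch on the binary (symlink) name: "clickhouse-git-import" selects git-import.
    std::string name = argv[0];
    name = name.substr(name.find_last_of('/') + 1);
    for (const auto & [app, entry] : apps)
        if (name == "clickhouse-" + app)
            return entry(argc, argv);

    /// 2. Otherwise dispatch on the first argument: "clickhouse git-import ...".
    if (argc >= 2)
        for (const auto & [app, entry] : apps)
            if (app == argv[1])
                return entry(argc - 1, argv + 1);

    std::cerr << "Usage: clickhouse <tool> [args...], e.g. clickhouse git-import\n";
    return 1;
}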
From 04a69650068c3ff5967f3639c55082dbd34017cf Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 09:40:01 +0300 Subject: [PATCH 045/341] Fix error with executable dictionary source --- docker/test/fasttest/run.sh | 3 +- docker/test/stateless/run.sh | 1 + docker/test/stateless_unbundled/run.sh | 1 + docker/test/stateless_with_coverage/run.sh | 1 + src/Common/tests/CMakeLists.txt | 3 + src/Common/tests/shell_command_inout.cpp | 47 +++++++ .../ExecutableDictionarySource.cpp | 119 ++++++++++-------- src/Dictionaries/ExecutableDictionarySource.h | 1 + tests/config/executable_dictionary.xml | 108 ++++++++++++++++ .../01474_executable_dictionary.reference | 3 + .../01474_executable_dictionary.sql | 3 + 11 files changed, 240 insertions(+), 50 deletions(-) create mode 100644 src/Common/tests/shell_command_inout.cpp create mode 100644 tests/config/executable_dictionary.xml create mode 100644 tests/queries/0_stateless/01474_executable_dictionary.reference create mode 100644 tests/queries/0_stateless/01474_executable_dictionary.sql diff --git a/docker/test/fasttest/run.sh b/docker/test/fasttest/run.sh index 1f8d612a125..9f5a9b05219 100755 --- a/docker/test/fasttest/run.sh +++ b/docker/test/fasttest/run.sh @@ -11,7 +11,7 @@ stage=${stage:-} # A variable to pass additional flags to CMake. # Here we explicitly default it to nothing so that bash doesn't complain about -# it being undefined. Also read it as array so that we can pass an empty list +# it being undefined. Also read it as array so that we can pass an empty list # of additional variable to cmake properly, and it doesn't generate an extra # empty parameter. read -ra FASTTEST_CMAKE_FLAGS <<< "${FASTTEST_CMAKE_FLAGS:-}" @@ -128,6 +128,7 @@ ln -s /usr/share/clickhouse-test/config/access_management.xml /etc/clickhouse-se ln -s /usr/share/clickhouse-test/config/ints_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/strings_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/decimals_dictionary.xml /etc/clickhouse-server/ +ln -s /usr/share/clickhouse-test/config/executable_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/macros.xml /etc/clickhouse-server/config.d/ ln -s /usr/share/clickhouse-test/config/disks.xml /etc/clickhouse-server/config.d/ #ln -s /usr/share/clickhouse-test/config/secure_ports.xml /etc/clickhouse-server/config.d/ diff --git a/docker/test/stateless/run.sh b/docker/test/stateless/run.sh index 2ff15ca9c6a..4a9ad891883 100755 --- a/docker/test/stateless/run.sh +++ b/docker/test/stateless/run.sh @@ -24,6 +24,7 @@ ln -s /usr/share/clickhouse-test/config/access_management.xml /etc/clickhouse-se ln -s /usr/share/clickhouse-test/config/ints_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/strings_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/decimals_dictionary.xml /etc/clickhouse-server/ +ln -s /usr/share/clickhouse-test/config/executable_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/macros.xml /etc/clickhouse-server/config.d/ ln -s /usr/share/clickhouse-test/config/disks.xml /etc/clickhouse-server/config.d/ ln -s /usr/share/clickhouse-test/config/secure_ports.xml /etc/clickhouse-server/config.d/ diff --git a/docker/test/stateless_unbundled/run.sh b/docker/test/stateless_unbundled/run.sh index 2ff15ca9c6a..4a9ad891883 100755 --- a/docker/test/stateless_unbundled/run.sh +++ b/docker/test/stateless_unbundled/run.sh @@ -24,6 +24,7 @@ ln -s 
/usr/share/clickhouse-test/config/access_management.xml /etc/clickhouse-se ln -s /usr/share/clickhouse-test/config/ints_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/strings_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/decimals_dictionary.xml /etc/clickhouse-server/ +ln -s /usr/share/clickhouse-test/config/executable_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/macros.xml /etc/clickhouse-server/config.d/ ln -s /usr/share/clickhouse-test/config/disks.xml /etc/clickhouse-server/config.d/ ln -s /usr/share/clickhouse-test/config/secure_ports.xml /etc/clickhouse-server/config.d/ diff --git a/docker/test/stateless_with_coverage/run.sh b/docker/test/stateless_with_coverage/run.sh index 64317ee62fd..c3ccb18659b 100755 --- a/docker/test/stateless_with_coverage/run.sh +++ b/docker/test/stateless_with_coverage/run.sh @@ -57,6 +57,7 @@ ln -s /usr/share/clickhouse-test/config/access_management.xml /etc/clickhouse-se ln -s /usr/share/clickhouse-test/config/ints_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/strings_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/decimals_dictionary.xml /etc/clickhouse-server/ +ln -s /usr/share/clickhouse-test/config/executable_dictionary.xml /etc/clickhouse-server/ ln -s /usr/share/clickhouse-test/config/macros.xml /etc/clickhouse-server/config.d/ ln -s /usr/share/clickhouse-test/config/disks.xml /etc/clickhouse-server/config.d/ ln -s /usr/share/clickhouse-test/config/secure_ports.xml /etc/clickhouse-server/config.d/ diff --git a/src/Common/tests/CMakeLists.txt b/src/Common/tests/CMakeLists.txt index f6c232cdd22..8de9424e044 100644 --- a/src/Common/tests/CMakeLists.txt +++ b/src/Common/tests/CMakeLists.txt @@ -84,3 +84,6 @@ target_link_libraries (procfs_metrics_provider_perf PRIVATE clickhouse_common_io add_executable (average average.cpp) target_link_libraries (average PRIVATE clickhouse_common_io) + +add_executable (shell_command_inout shell_command_inout.cpp) +target_link_libraries (shell_command_inout PRIVATE clickhouse_common_io) diff --git a/src/Common/tests/shell_command_inout.cpp b/src/Common/tests/shell_command_inout.cpp new file mode 100644 index 00000000000..615700cd042 --- /dev/null +++ b/src/Common/tests/shell_command_inout.cpp @@ -0,0 +1,47 @@ +#include + +#include +#include + +#include +#include +#include + +/** This example shows how we can proxy stdin to ShellCommand and obtain stdout in streaming fashion. */ + +int main(int argc, char ** argv) +try +{ + using namespace DB; + + if (argc < 2) + { + std::cerr << "Usage: shell_command_inout 'command...' < in > out\n"; + return 1; + } + + auto command = ShellCommand::execute(argv[1]); + + ReadBufferFromFileDescriptor in(STDIN_FILENO); + WriteBufferFromFileDescriptor out(STDOUT_FILENO); + WriteBufferFromFileDescriptor err(STDERR_FILENO); + + /// Background thread sends data and foreground thread receives result. + + std::thread thread([&] + { + copyData(in, command->in); + command->in.close(); + }); + + copyData(command->out, out); + copyData(command->err, err); + + thread.join(); + return 0; +} +catch (...) 
+{ + std::cerr << DB::getCurrentExceptionMessage(true) << '\n'; + throw; +} diff --git a/src/Dictionaries/ExecutableDictionarySource.cpp b/src/Dictionaries/ExecutableDictionarySource.cpp index 918cf0732ab..74aab610e0d 100644 --- a/src/Dictionaries/ExecutableDictionarySource.cpp +++ b/src/Dictionaries/ExecutableDictionarySource.cpp @@ -1,12 +1,13 @@ #include "ExecutableDictionarySource.h" -#include -#include +#include #include #include #include #include #include +#include +#include #include #include #include @@ -16,6 +17,7 @@ #include "DictionaryStructure.h" #include "registerDictionaries.h" + namespace DB { static const UInt64 max_block_size = 8192; @@ -31,15 +33,23 @@ namespace /// Owns ShellCommand and calls wait for it. class ShellCommandOwningBlockInputStream : public OwningBlockInputStream { + private: + Poco::Logger * log; public: - ShellCommandOwningBlockInputStream(const BlockInputStreamPtr & impl, std::unique_ptr own_) - : OwningBlockInputStream(std::move(impl), std::move(own_)) + ShellCommandOwningBlockInputStream(Poco::Logger * log_, const BlockInputStreamPtr & impl, std::unique_ptr command_) + : OwningBlockInputStream(std::move(impl), std::move(command_)), log(log_) { } void readSuffix() override { OwningBlockInputStream::readSuffix(); + + std::string err; + readStringUntilEOF(err, own->err); + if (!err.empty()) + LOG_ERROR(log, "Having stderr: {}", err); + own->wait(); } }; @@ -80,7 +90,7 @@ BlockInputStreamPtr ExecutableDictionarySource::loadAll() LOG_TRACE(log, "loadAll {}", toString()); auto process = ShellCommand::execute(command); auto input_stream = context.getInputFormat(format, process->out, sample_block, max_block_size); - return std::make_shared(input_stream, std::move(process)); + return std::make_shared(log, input_stream, std::move(process)); } BlockInputStreamPtr ExecutableDictionarySource::loadUpdatedAll() @@ -95,67 +105,77 @@ BlockInputStreamPtr ExecutableDictionarySource::loadUpdatedAll() LOG_TRACE(log, "loadUpdatedAll {}", command_with_update_field); auto process = ShellCommand::execute(command_with_update_field); auto input_stream = context.getInputFormat(format, process->out, sample_block, max_block_size); - return std::make_shared(input_stream, std::move(process)); + return std::make_shared(log, input_stream, std::move(process)); } namespace { - /** A stream, that also runs and waits for background thread - * (that will feed data into pipe to be read from the other side of the pipe). + /** A stream, that runs child process and sends data to its stdin in background thread, + * and receives data from its stdout. 
*/ class BlockInputStreamWithBackgroundThread final : public IBlockInputStream { public: BlockInputStreamWithBackgroundThread( - const BlockInputStreamPtr & stream_, std::unique_ptr && command_, std::packaged_task && task_) - : stream{stream_}, command{std::move(command_)}, task(std::move(task_)), thread([this] { - task(); - command->in.close(); - }) + const Context & context, + const std::string & format, + const Block & sample_block, + const std::string & command_str, + Poco::Logger * log_, + std::function && send_data_) + : log(log_), + command(ShellCommand::execute(command_str)), + send_data(std::move(send_data_)), + thread([this] { send_data(command->in); }) { - children.push_back(stream); + //WriteBufferFromFileDescriptor err(STDERR_FILENO); + //copyData(command->out, err); + //err.next(); + //thread.join(); + stream = context.getInputFormat(format, command->out, sample_block, max_block_size); } ~BlockInputStreamWithBackgroundThread() override { if (thread.joinable()) - { - try - { - readSuffix(); - } - catch (...) - { - tryLogCurrentException(__PRETTY_FUNCTION__); - } - } + thread.join(); } - Block getHeader() const override { return stream->getHeader(); } + Block getHeader() const override + { + return stream->getHeader(); + } private: - Block readImpl() override { return stream->read(); } + Block readImpl() override + { + return stream->read(); + } + + void readPrefix() override + { + stream->readPrefix(); + } void readSuffix() override { - IBlockInputStream::readSuffix(); - if (!wait_called) - { - wait_called = true; - command->wait(); - } - thread.join(); - /// To rethrow an exception, if any. - task.get_future().get(); + stream->readSuffix(); + + std::string err; + readStringUntilEOF(err, command->err); + if (!err.empty()) + LOG_ERROR(log, "Having stderr: {}", err); + + command->wait(); } String getName() const override { return "WithBackgroundThread"; } + Poco::Logger * log; BlockInputStreamPtr stream; std::unique_ptr command; - std::packaged_task task; - ThreadFromGlobalPool thread; - bool wait_called = false; + std::function send_data; + mutable ThreadFromGlobalPool thread; }; } @@ -164,28 +184,29 @@ namespace BlockInputStreamPtr ExecutableDictionarySource::loadIds(const std::vector & ids) { LOG_TRACE(log, "loadIds {} size = {}", toString(), ids.size()); - auto process = ShellCommand::execute(command); - - auto output_stream = context.getOutputFormat(format, process->in, sample_block); - auto input_stream = context.getInputFormat(format, process->out, sample_block, max_block_size); return std::make_shared( - input_stream, std::move(process), std::packaged_task([output_stream, &ids]() mutable { formatIDs(output_stream, ids); })); + context, format, sample_block, command, log, + [&ids, this](WriteBufferFromFile & out) mutable + { + auto output_stream = context.getOutputFormat(format, out, sample_block); + formatIDs(output_stream, ids); + out.close(); + }); } BlockInputStreamPtr ExecutableDictionarySource::loadKeys(const Columns & key_columns, const std::vector & requested_rows) { LOG_TRACE(log, "loadKeys {} size = {}", toString(), requested_rows.size()); - auto process = ShellCommand::execute(command); - - auto output_stream = context.getOutputFormat(format, process->in, sample_block); - auto input_stream = context.getInputFormat(format, process->out, sample_block, max_block_size); return std::make_shared( - input_stream, std::move(process), std::packaged_task([output_stream, key_columns, &requested_rows, this]() mutable + context, format, sample_block, command, log, + 
[key_columns, &requested_rows, this](WriteBufferFromFile & out) mutable { + auto output_stream = context.getOutputFormat(format, out, sample_block); formatKeys(dict_struct, output_stream, key_columns, requested_rows); - })); + out.close(); + }); } bool ExecutableDictionarySource::isModified() const diff --git a/src/Dictionaries/ExecutableDictionarySource.h b/src/Dictionaries/ExecutableDictionarySource.h index f28d71ca5e3..b2aabf26323 100644 --- a/src/Dictionaries/ExecutableDictionarySource.h +++ b/src/Dictionaries/ExecutableDictionarySource.h @@ -14,6 +14,7 @@ namespace DB /// Allows loading dictionaries from executable class ExecutableDictionarySource final : public IDictionarySource { + friend class BlockInputStreamWithBackgroundThread; public: ExecutableDictionarySource( const DictionaryStructure & dict_struct_, diff --git a/tests/config/executable_dictionary.xml b/tests/config/executable_dictionary.xml new file mode 100644 index 00000000000..50df32e2ec6 --- /dev/null +++ b/tests/config/executable_dictionary.xml @@ -0,0 +1,108 @@ + + + + executable_complex + + + JSONEachRow + cd /; clickhouse-local --input-format JSONEachRow --output-format JSONEachRow --structure 'x UInt64, y UInt64' --query "SELECT x, y, x + y AS a, x * y AS b FROM table" + + + 0 + + + 1000 + + + + + + x + UInt64 + + + y + UInt64 + + + + a + UInt64 + 0 + + + b + UInt64 + 0 + + + + + + executable_simple + + + JSONEachRow + cd /; clickhouse-local --input-format JSONEachRow --output-format JSONEachRow --structure 'x UInt64' --query "SELECT x, x + x AS a, x * x AS b FROM table" + + + 0 + + + 1000 + + + + + x + + + a + UInt64 + 0 + + + b + UInt64 + 0 + + + + + + executable_complex_direct + + + JSONEachRow + cd /; clickhouse-local --input-format JSONEachRow --output-format JSONEachRow --structure 'x UInt64, y UInt64' --query "SELECT x, y, x + y AS a, x * y AS b FROM table" + + + 0 + + + + + + + x + UInt64 + + + y + UInt64 + + + + a + UInt64 + 0 + + + b + UInt64 + 0 + + + + + diff --git a/tests/queries/0_stateless/01474_executable_dictionary.reference b/tests/queries/0_stateless/01474_executable_dictionary.reference new file mode 100644 index 00000000000..4d0994b08c3 --- /dev/null +++ b/tests/queries/0_stateless/01474_executable_dictionary.reference @@ -0,0 +1,3 @@ +999999 1999998 999998000001 +999999 1999998 999998000001 +999999 1999998 999998000001 diff --git a/tests/queries/0_stateless/01474_executable_dictionary.sql b/tests/queries/0_stateless/01474_executable_dictionary.sql new file mode 100644 index 00000000000..727cf47f79f --- /dev/null +++ b/tests/queries/0_stateless/01474_executable_dictionary.sql @@ -0,0 +1,3 @@ +SELECT number, dictGet('executable_complex', 'a', (number, number)) AS a, dictGet('executable_complex', 'b', (number, number)) AS b FROM numbers(1000000) WHERE number = 999999; +SELECT number, dictGet('executable_complex_direct', 'a', (number, number)) AS a, dictGet('executable_complex_direct', 'b', (number, number)) AS b FROM numbers(1000000) WHERE number = 999999; +SELECT number, dictGet('executable_simple', 'a', number) AS a, dictGet('executable_simple', 'b', number) AS b FROM numbers(1000000) WHERE number = 999999; From 8dd98f74a5a5cd5c5cba804f96b3349c5f9a2e25 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 09:43:28 +0300 Subject: [PATCH 046/341] Remove debug output --- src/Dictionaries/ExecutableDictionarySource.cpp | 4 ---- 1 file changed, 4 deletions(-) diff --git a/src/Dictionaries/ExecutableDictionarySource.cpp b/src/Dictionaries/ExecutableDictionarySource.cpp index 
74aab610e0d..0709be2420a 100644 --- a/src/Dictionaries/ExecutableDictionarySource.cpp +++ b/src/Dictionaries/ExecutableDictionarySource.cpp @@ -128,10 +128,6 @@ namespace send_data(std::move(send_data_)), thread([this] { send_data(command->in); }) { - //WriteBufferFromFileDescriptor err(STDERR_FILENO); - //copyData(command->out, err); - //err.next(); - //thread.join(); stream = context.getInputFormat(format, command->out, sample_block, max_block_size); } From 1f0d2be17adbc292fef91d4b7703d654871cb815 Mon Sep 17 00:00:00 2001 From: alexey-milovidov Date: Mon, 7 Sep 2020 09:44:32 +0300 Subject: [PATCH 047/341] Update ExecutableDictionarySource.h --- src/Dictionaries/ExecutableDictionarySource.h | 1 - 1 file changed, 1 deletion(-) diff --git a/src/Dictionaries/ExecutableDictionarySource.h b/src/Dictionaries/ExecutableDictionarySource.h index b2aabf26323..f28d71ca5e3 100644 --- a/src/Dictionaries/ExecutableDictionarySource.h +++ b/src/Dictionaries/ExecutableDictionarySource.h @@ -14,7 +14,6 @@ namespace DB /// Allows loading dictionaries from executable class ExecutableDictionarySource final : public IDictionarySource { - friend class BlockInputStreamWithBackgroundThread; public: ExecutableDictionarySource( const DictionaryStructure & dict_struct_, From 3903794386c32d1894fa266d760eed07419a1d54 Mon Sep 17 00:00:00 2001 From: alexey-milovidov Date: Mon, 7 Sep 2020 09:45:01 +0300 Subject: [PATCH 048/341] Update ExecutableDictionarySource.cpp --- src/Dictionaries/ExecutableDictionarySource.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Dictionaries/ExecutableDictionarySource.cpp b/src/Dictionaries/ExecutableDictionarySource.cpp index 0709be2420a..cc250727261 100644 --- a/src/Dictionaries/ExecutableDictionarySource.cpp +++ b/src/Dictionaries/ExecutableDictionarySource.cpp @@ -171,7 +171,7 @@ namespace BlockInputStreamPtr stream; std::unique_ptr command; std::function send_data; - mutable ThreadFromGlobalPool thread; + ThreadFromGlobalPool thread; }; } From 3942cc615f03ecb8e5b9e7437fdc5c57613c245d Mon Sep 17 00:00:00 2001 From: alexey-milovidov Date: Mon, 7 Sep 2020 10:09:42 +0300 Subject: [PATCH 049/341] Update git-import.cpp --- programs/git-import/git-import.cpp | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/programs/git-import/git-import.cpp b/programs/git-import/git-import.cpp index d314969a1a8..45bc47348e7 100644 --- a/programs/git-import/git-import.cpp +++ b/programs/git-import/git-import.cpp @@ -9,7 +9,7 @@ #include #include -#include +#include #include @@ -539,8 +539,8 @@ struct Options bool skip_commits_without_parents = true; bool skip_commits_with_duplicate_diffs = true; size_t threads = 1; - std::optional skip_paths; - std::optional skip_commits_with_messages; + std::optional skip_paths; + std::optional skip_commits_with_messages; std::unordered_set skip_commits; std::optional diff_size_limit; std::string stop_after_commit; @@ -857,7 +857,7 @@ void processFileChanges( assertChar('\n', in); - if (!(options.skip_paths && re2_st::RE2::PartialMatch(file_change.path, *options.skip_paths))) + if (!(options.skip_paths && re2::RE2::PartialMatch(file_change.path, *options.skip_paths))) { file_changes.emplace( file_change.path, @@ -1070,7 +1070,7 @@ void processCommit( readNullTerminated(parent_hash, in); readNullTerminated(commit.message, in); - if (options.skip_commits_with_messages && re2_st::RE2::PartialMatch(commit.message, *options.skip_commits_with_messages)) + if (options.skip_commits_with_messages && 
re2::RE2::PartialMatch(commit.message, *options.skip_commits_with_messages)) return; std::string message_to_print = commit.message; From 4c3c1cdaf3e4064a5d65a40dea5383e522e8f2ee Mon Sep 17 00:00:00 2001 From: Amos Bird Date: Mon, 7 Sep 2020 15:24:27 +0800 Subject: [PATCH 050/341] Fix Nullable String to Enum conversion. --- src/Functions/FunctionsConversion.h | 4 +--- .../01490_nullable_string_to_enum.reference | 1 + .../0_stateless/01490_nullable_string_to_enum.sql | 12 ++++++++++++ 3 files changed, 14 insertions(+), 3 deletions(-) create mode 100644 tests/queries/0_stateless/01490_nullable_string_to_enum.reference create mode 100644 tests/queries/0_stateless/01490_nullable_string_to_enum.sql diff --git a/src/Functions/FunctionsConversion.h b/src/Functions/FunctionsConversion.h index a18139fd4c8..ffe7677afe7 100644 --- a/src/Functions/FunctionsConversion.h +++ b/src/Functions/FunctionsConversion.h @@ -2260,9 +2260,7 @@ private: size_t nullable_pos = block.columns() - 1; nullable_col = typeid_cast(block.getByPosition(nullable_pos).column.get()); - if (!nullable_col) - throw Exception("Last column should be ColumnNullable", ErrorCodes::LOGICAL_ERROR); - if (col && nullable_col->size() != col->size()) + if (col && nullable_col && nullable_col->size() != col->size()) throw Exception("ColumnNullable is not compatible with original", ErrorCodes::LOGICAL_ERROR); } diff --git a/tests/queries/0_stateless/01490_nullable_string_to_enum.reference b/tests/queries/0_stateless/01490_nullable_string_to_enum.reference new file mode 100644 index 00000000000..ce013625030 --- /dev/null +++ b/tests/queries/0_stateless/01490_nullable_string_to_enum.reference @@ -0,0 +1 @@ +hello diff --git a/tests/queries/0_stateless/01490_nullable_string_to_enum.sql b/tests/queries/0_stateless/01490_nullable_string_to_enum.sql new file mode 100644 index 00000000000..e0624af4a7a --- /dev/null +++ b/tests/queries/0_stateless/01490_nullable_string_to_enum.sql @@ -0,0 +1,12 @@ +DROP TABLE IF EXISTS t_enum; +DROP TABLE IF EXISTS t_source; + +CREATE TABLE t_enum(x Enum8('hello' = 1, 'world' = 2)) ENGINE = TinyLog; +CREATE TABLE t_source(x Nullable(String)) ENGINE = TinyLog; + +INSERT INTO t_source (x) VALUES ('hello'); +INSERT INTO t_enum(x) SELECT x from t_source WHERE x in ('hello', 'world'); +SELECT * FROM t_enum; + +DROP TABLE IF EXISTS t_enum; +DROP TABLE IF EXISTS t_source; From 99ebab706cf70a286a5a6b5b2ac6070085f1ebf0 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 12:02:22 +0300 Subject: [PATCH 051/341] Fix "Arcadia" --- tests/queries/0_stateless/arcadia_skip_list.txt | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/queries/0_stateless/arcadia_skip_list.txt b/tests/queries/0_stateless/arcadia_skip_list.txt index 707f91b0c93..16450efb26e 100644 --- a/tests/queries/0_stateless/arcadia_skip_list.txt +++ b/tests/queries/0_stateless/arcadia_skip_list.txt @@ -139,3 +139,4 @@ 01455_time_zones 01456_ast_optimizations_over_distributed 01460_DistributedFilesToInsert +01474_executable_dictionary From 661d9bdb4c1489d6a9c5c8f0ae6d06bb5480a2b9 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 7 Sep 2020 19:03:36 +0300 Subject: [PATCH 052/341] Skip test --- tests/queries/skip_list.json | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tests/queries/skip_list.json b/tests/queries/skip_list.json index adfc5f0e582..0aa98499d42 100644 --- a/tests/queries/skip_list.json +++ b/tests/queries/skip_list.json @@ -18,7 +18,8 @@ "00152_insert_different_granularity", 
"00151_replace_partition_with_different_granularity", "00157_cache_dictionary", - "01193_metadata_loading" + "01193_metadata_loading", + "01474_executable_dictionary" /// informational stderr from sanitizer at start ], "address-sanitizer": [ "00281", From 2c04b0a8e67d1aeefdbb523ac4f8cd321b83a347 Mon Sep 17 00:00:00 2001 From: Nikita Mikhaylov Date: Mon, 7 Sep 2020 19:07:34 +0300 Subject: [PATCH 053/341] comment added --- .../Formats/Impl/JSONCompactEachRowRowInputFormat.h | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h index 593f297108c..6845b2974ab 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h @@ -12,7 +12,12 @@ namespace DB class ReadBuffer; -/** A stream for reading data in JSONCompactEachRow- formats +/** A stream for reading data in a bunch of formats: + * - JSONCompactEachRow + * - JSONCompactEachRowWithNamesAndTypes + * - JSONCompactStringsEachRow + * - JSONCompactStringsEachRowWithNamesAndTypes + * */ class JSONCompactEachRowRowInputFormat : public IRowInputFormat { @@ -54,7 +59,9 @@ private: /// This is for the correct exceptions in skipping unknown fields. std::vector names_of_columns; + /// For *WithNamesAndTypes formats. bool with_names; + /// For JSONCompactString* formats. bool yield_strings; }; From a56d42de67496404fb507d05c2d399012fd479ce Mon Sep 17 00:00:00 2001 From: Nikita Mikhaylov Date: Mon, 7 Sep 2020 20:55:06 +0300 Subject: [PATCH 054/341] fix arcadia --- src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h | 2 -- src/Processors/ya.make | 3 --- 2 files changed, 5 deletions(-) diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h index 6845b2974ab..4077eb6e008 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.h @@ -1,7 +1,5 @@ #pragma once -#pragma once - #include #include #include diff --git a/src/Processors/ya.make b/src/Processors/ya.make index 27893674859..30de38fedbd 100644 --- a/src/Processors/ya.make +++ b/src/Processors/ya.make @@ -31,9 +31,6 @@ SRCS( Formats/Impl/JSONEachRowRowOutputFormat.cpp Formats/Impl/JSONEachRowWithProgressRowOutputFormat.cpp Formats/Impl/JSONRowOutputFormat.cpp - Formats/Impl/JSONStringsEachRowRowInputFormat.cpp - Formats/Impl/JSONStringsEachRowRowOutputFormat.cpp - Formats/Impl/JSONStringsRowOutputFormat.cpp Formats/Impl/MarkdownRowOutputFormat.cpp Formats/Impl/MsgPackRowInputFormat.cpp Formats/Impl/MsgPackRowOutputFormat.cpp From 0c00b992d5741f7d9750567afd3cbda92b019273 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Mon, 7 Sep 2020 16:01:49 -0700 Subject: [PATCH 055/341] StorageReplicatedMergeTree - cleanup data dir after Zk exceptions It's possible for `getZooKeeper()` to timeout if zookeeper host(s) can't be reached. In such cases `Poco::Exception` is thrown after a connection timeout - refer to `src/Common/ZooKeeper/ZooKeeperImpl.cpp:866` for more info. Side effect of this is that the CreateQuery gets interrupted and it exits. But the data Directories for the tables being created aren't cleaned up. This unclean state will hinder table creation on any retries and will complain that the Directory for table already exists. 
To achieve a clean state on failed table creations, catch this error if the exception is of type Poco::Exception and call `dropIfEmpty()` method, then proceed throwing the exception. Without this, the Directory for the tables needs to be manually deleted before retrying the CreateQuery. --- src/Storages/StorageReplicatedMergeTree.cpp | 25 ++++++++++++++++++++- 1 file changed, 24 insertions(+), 1 deletion(-) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index 6058632d220..64eb1c8d4cd 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -216,7 +216,30 @@ StorageReplicatedMergeTree::StorageReplicatedMergeTree( getStorageID().getFullTableName() + " (StorageReplicatedMergeTree::mutationsFinalizingTask)", [this] { mutationsFinalizingTask(); }); if (global_context.hasZooKeeper()) - current_zookeeper = global_context.getZooKeeper(); + { + /// It's possible for getZooKeeper() to timeout if zookeeper host(s) can't + /// be reached. In such cases Poco::Exception is thrown after a connection + /// timeout - refer to src/Common/ZooKeeper/ZooKeeperImpl.cpp:866 for more info. + /// + /// Side effect of this is that the CreateQuery gets interrupted and it exits. + /// But the data Directories for the tables being created aren't cleaned up. + /// This unclean state will hinder table creation on any retries and will + /// complain that the Directory for table already exists. + /// + /// To achieve a clean state on failed table creations, catch this error if + /// the exception is of type Poco::Exception and call dropIfEmpty() method, + /// then proceed throwing the exception. Without this, the Directory for the + /// tables needs to be manually deleted before retrying the CreateQuery. + try + { + current_zookeeper = global_context.getZooKeeper(); + } + catch (Poco::Exception & e) + { + dropIfEmpty(); + throw e; + } + } bool skip_sanity_checks = false; From 806334a642a87c09b77a2b69c765ea10ecbcaad7 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Mon, 7 Sep 2020 22:27:49 -0700 Subject: [PATCH 056/341] StorageReplicatedMergeTree - add integration tests that test dir cleanup This adds an integration test that verifies the table directory is cleaned up after a ZooKeeper connection failure for ReplicatedMergeTree tables.
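Before the new test files, it may help to restate the cleanup-on-failure pattern from the previous patch in isolation: if initialization throws after the table's directory has already been created on disk, remove the still-empty directory and rethrow, so that retrying the CREATE does not fail with "directory already exists". The following is a simplified standalone sketch, not ClickHouse code; connectOrThrow() merely stands in for the ZooKeeper connection attempt and the paths are illustrative.

#include <filesystem>
#include <iostream>
#include <stdexcept>

namespace fs = std::filesystem;

/// Stand-in for the connection attempt: pretend it always times out.
void connectOrThrow()
{
    throw std::runtime_error("All connection tries failed while connecting to ZooKeeper");
}

/// Create the table directory, then try to connect; on failure remove the
/// just-created (still empty) directory so a retry starts from a clean state.
void createTable(const fs::path & table_dir)
{
    fs::create_directories(table_dir);
    try
    {
        connectOrThrow();
    }
    catch (...)
    {
        if (fs::exists(table_dir) && fs::is_empty(table_dir))
            fs::remove(table_dir);  /// analogous to dropIfEmpty()
        throw;                      /// propagate the original error to the caller
    }
}

int main()
{
    for (int attempt = 1; attempt <= 2; ++attempt)
    {
        try
        {
            createTable("data/replica/test");
        }
        catch (const std::exception & e)
        {
            /// Both attempts fail for the same reason; neither leaves a directory behind.
            std::cout << "attempt " << attempt << " failed: " << e.what() << '\n';
        }
    }
    return 0;
}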
--- .../__init__.py | 0 .../configs/remote_servers.xml | 14 ++++++ .../test_replicated_zk_conn_failure/test.py | 45 +++++++++++++++++++ 3 files changed, 59 insertions(+) create mode 100644 tests/integration/test_replicated_zk_conn_failure/__init__.py create mode 100644 tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml create mode 100644 tests/integration/test_replicated_zk_conn_failure/test.py diff --git a/tests/integration/test_replicated_zk_conn_failure/__init__.py b/tests/integration/test_replicated_zk_conn_failure/__init__.py new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml b/tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml new file mode 100644 index 00000000000..538aa72d386 --- /dev/null +++ b/tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml @@ -0,0 +1,14 @@ + + + + + true + + shard_0 + node1 + 9000 + + + + + diff --git a/tests/integration/test_replicated_zk_conn_failure/test.py b/tests/integration/test_replicated_zk_conn_failure/test.py new file mode 100644 index 00000000000..3f106bd2981 --- /dev/null +++ b/tests/integration/test_replicated_zk_conn_failure/test.py @@ -0,0 +1,45 @@ +import time + +from helpers.cluster import ClickHouseCluster +from helpers.network import PartitionManager + + +# This tests if the data directory for a table is cleaned up if there is a ZooKeeper +# connection exception during a CreateQuery operation involving ReplicatedMergeTree tables. +# Test flow is as follows: +# 1. Configure cluster with ZooKeeper and create a database. +# 2. Drop all connections to ZooKeeper. +# 3. Try creating the table and there would be a Poco::Exception. +# 4. Try creating the table again and there should not be any error +# that indicates that the Directory for table already exists. + + +def test_replicated_zk_conn_failure(): + cluster = ClickHouseCluster(__file__) + node1 = cluster.add_instance('node1', main_configs=["configs/remote_servers.xml"], with_zookeeper=True) + try: + cluster.start() + node1.query("CREATE DATABASE replica;") + query_create = '''CREATE TABLE replica.test + ( + id Int64, + event_time DateTime + ) + Engine=ReplicatedMergeTree('/clickhouse/tables/replica/test', 'node1') + PARTITION BY toYYYYMMDD(event_time) + ORDER BY id;'''.format(replica=node1.name) + with PartitionManager() as pm: + pm.drop_instance_zk_connections(node1) + time.sleep(5) + error = node1.query_and_get_error(query_create) + # Assert that there was a network exception. + assert "Poco::Exception. Code: 1000" in error + # Assert that the exception was due to ZooKeeper connectivity. + assert "All connection tries failed while connecting to ZooKeeper" in error + # retry table creation + error = node1.query_and_get_error(query_create) + # Should not expect any errors related to directory already existing + # and those should have been already cleaned up during the previous retry.
+ assert "Directory for table data data/replica/test/ already exists" not in error + finally: + cluster.shutdown() From 78eac658b0d3250c10e177f38a88cc32ef102b3a Mon Sep 17 00:00:00 2001 From: myrrc Date: Tue, 8 Sep 2020 22:51:44 +0300 Subject: [PATCH 057/341] adding correct LC nested nullability checker --- src/Columns/ColumnLowCardinality.h | 3 ++- src/Functions/array/arrayIndex.h | 8 +++++--- 2 files changed, 7 insertions(+), 4 deletions(-) diff --git a/src/Columns/ColumnLowCardinality.h b/src/Columns/ColumnLowCardinality.h index e3b879d6dd5..00f58a133cf 100644 --- a/src/Columns/ColumnLowCardinality.h +++ b/src/Columns/ColumnLowCardinality.h @@ -170,7 +170,8 @@ public: size_t sizeOfValueIfFixed() const override { return getDictionary().sizeOfValueIfFixed(); } bool isNumeric() const override { return getDictionary().isNumeric(); } bool lowCardinality() const override { return true; } - bool isNullable() const override { return isColumnNullable(*dictionary.getColumnUniquePtr()); } + + bool nestedIsNullable() const { return isColumnNullable(*dictionary.getColumnUnique().getNestedColumn()); } const IColumnUnique & getDictionary() const { return dictionary.getColumnUnique(); } const ColumnPtr & getDictionaryPtr() const { return dictionary.getColumnUniquePtr(); } diff --git a/src/Functions/array/arrayIndex.h b/src/Functions/array/arrayIndex.h index b12372d28ce..f96eb09c861 100644 --- a/src/Functions/array/arrayIndex.h +++ b/src/Functions/array/arrayIndex.h @@ -1,5 +1,3 @@ -#include -#include #include #include #include @@ -741,6 +739,10 @@ private: if (!col_lc) return false; +// assert(checkAndGetColumn(col_lc->getDictionaryPtr().get())); +// assert(col_lc->isNullable()); +// assert(isColumnNullable(*col_lc->getDictionaryPtr().get())); + const auto [null_map_data, null_map_item] = getNullMaps(block, arguments); const IColumn& col_arg = *block.getByPosition(arguments[1]).column.get(); @@ -799,7 +801,7 @@ private: block.getByPosition(result).column = std::move(col_result); return true; } - else if (col_lc->getDictionaryPtr()->isNullable()) // LC(Nullable(T)) and U + else if (col_lc->nestedIsNullable()) // LC(Nullable(T)) and U { const ColumnPtr left_casted = col_lc->convertToFullColumnIfLowCardinality(); // Nullable(T) const ColumnNullable& left_nullable = *checkAndGetColumn(left_casted.get()); From 4f1321daef3af1a4eac14d7c0d33f925e6bb5557 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Tue, 8 Sep 2020 23:05:27 +0300 Subject: [PATCH 058/341] Make 00443_merge_tree_uniform_read_distribution_0.reference real file (was symlink) --- .../00443_merge_tree_uniform_read_distribution_0.reference | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) mode change 120000 => 100644 tests/queries/0_stateless/00443_merge_tree_uniform_read_distribution_0.reference diff --git a/tests/queries/0_stateless/00443_merge_tree_uniform_read_distribution_0.reference b/tests/queries/0_stateless/00443_merge_tree_uniform_read_distribution_0.reference deleted file mode 120000 index 4d2577d02a3..00000000000 --- a/tests/queries/0_stateless/00443_merge_tree_uniform_read_distribution_0.reference +++ /dev/null @@ -1 +0,0 @@ -00443_optimize_final_vertical_merge.reference \ No newline at end of file diff --git a/tests/queries/0_stateless/00443_merge_tree_uniform_read_distribution_0.reference b/tests/queries/0_stateless/00443_merge_tree_uniform_read_distribution_0.reference new file mode 100644 index 00000000000..bb6e92ae8e7 --- /dev/null +++ b/tests/queries/0_stateless/00443_merge_tree_uniform_read_distribution_0.reference @@ -0,0 
+1,3 @@ +1500000 1500000 1500000 1500000 1500000 1500000 +[['def']] [['','']] +0 From 014c7c02bdc454a4b53c44d1525c9932906d07ca Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Tue, 8 Sep 2020 23:34:10 +0300 Subject: [PATCH 059/341] Fix some trailing whitespaces in query format The following statements still has the trailing whitespace: - WITH - SELECT - SELECT DISTINCT - ARRAY JOIN - GROUP BY - ORDER BY - LIMIT BY --- src/Parsers/ASTExpressionList.cpp | 9 +++++++++ src/Parsers/ASTFunction.cpp | 1 + src/Parsers/ASTSelectQuery.cpp | 12 +++++++----- src/Parsers/ASTTablesInSelectQuery.cpp | 5 ++++- src/Parsers/IAST.h | 1 + 5 files changed, 22 insertions(+), 6 deletions(-) diff --git a/src/Parsers/ASTExpressionList.cpp b/src/Parsers/ASTExpressionList.cpp index abab1e895cf..de38e1fd7ea 100644 --- a/src/Parsers/ASTExpressionList.cpp +++ b/src/Parsers/ASTExpressionList.cpp @@ -13,6 +13,9 @@ ASTPtr ASTExpressionList::clone() const void ASTExpressionList::formatImpl(const FormatSettings & settings, FormatState & state, FormatStateStacked frame) const { + if (frame.expression_list_prepend_whitespace) + settings.ostr << ' '; + for (ASTs::const_iterator it = children.begin(); it != children.end(); ++it) { if (it != children.begin()) @@ -30,6 +33,12 @@ void ASTExpressionList::formatImplMultiline(const FormatSettings & settings, For { std::string indent_str = "\n" + std::string(4 * (frame.indent + 1), ' '); + if (frame.expression_list_prepend_whitespace) + { + if (!(children.size() > 1 || frame.expression_list_always_start_on_new_line)) + settings.ostr << ' '; + } + ++frame.indent; for (ASTs::const_iterator it = children.begin(); it != children.end(); ++it) { diff --git a/src/Parsers/ASTFunction.cpp b/src/Parsers/ASTFunction.cpp index 07429c8104f..ebef4261d01 100644 --- a/src/Parsers/ASTFunction.cpp +++ b/src/Parsers/ASTFunction.cpp @@ -114,6 +114,7 @@ static bool highlightStringLiteralWithMetacharacters(const ASTPtr & node, const void ASTFunction::formatImplWithoutAlias(const FormatSettings & settings, FormatState & state, FormatStateStacked frame) const { + frame.expression_list_prepend_whitespace = false; FormatStateStacked nested_need_parens = frame; FormatStateStacked nested_dont_need_parens = frame; nested_need_parens.need_parens = true; diff --git a/src/Parsers/ASTSelectQuery.cpp b/src/Parsers/ASTSelectQuery.cpp index fdc7bd47e4d..499761c4634 100644 --- a/src/Parsers/ASTSelectQuery.cpp +++ b/src/Parsers/ASTSelectQuery.cpp @@ -72,18 +72,20 @@ void ASTSelectQuery::formatImpl(const FormatSettings & s, FormatState & state, F { frame.current_select = this; frame.need_parens = false; + frame.expression_list_prepend_whitespace = true; + std::string indent_str = s.one_line ? "" : std::string(4 * frame.indent, ' '); if (with()) { - s.ostr << (s.hilite ? hilite_keyword : "") << indent_str << "WITH " << (s.hilite ? hilite_none : ""); + s.ostr << (s.hilite ? hilite_keyword : "") << indent_str << "WITH" << (s.hilite ? hilite_none : ""); s.one_line ? with()->formatImpl(s, state, frame) : with()->as().formatImplMultiline(s, state, frame); s.ostr << s.nl_or_ws; } - s.ostr << (s.hilite ? hilite_keyword : "") << indent_str << "SELECT " << (distinct ? "DISTINCT " : "") << (s.hilite ? hilite_none : ""); + s.ostr << (s.hilite ? hilite_keyword : "") << indent_str << "SELECT" << (distinct ? " DISTINCT" : "") << (s.hilite ? hilite_none : ""); s.one_line ? 
select()->formatImpl(s, state, frame) @@ -109,7 +111,7 @@ void ASTSelectQuery::formatImpl(const FormatSettings & s, FormatState & state, F if (groupBy()) { - s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "GROUP BY " << (s.hilite ? hilite_none : ""); + s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "GROUP BY" << (s.hilite ? hilite_none : ""); s.one_line ? groupBy()->formatImpl(s, state, frame) : groupBy()->as().formatImplMultiline(s, state, frame); @@ -132,7 +134,7 @@ void ASTSelectQuery::formatImpl(const FormatSettings & s, FormatState & state, F if (orderBy()) { - s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "ORDER BY " << (s.hilite ? hilite_none : ""); + s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "ORDER BY" << (s.hilite ? hilite_none : ""); s.one_line ? orderBy()->formatImpl(s, state, frame) : orderBy()->as().formatImplMultiline(s, state, frame); @@ -147,7 +149,7 @@ void ASTSelectQuery::formatImpl(const FormatSettings & s, FormatState & state, F s.ostr << ", "; } limitByLength()->formatImpl(s, state, frame); - s.ostr << (s.hilite ? hilite_keyword : "") << " BY " << (s.hilite ? hilite_none : ""); + s.ostr << (s.hilite ? hilite_keyword : "") << " BY" << (s.hilite ? hilite_none : ""); s.one_line ? limitBy()->formatImpl(s, state, frame) : limitBy()->as().formatImplMultiline(s, state, frame); diff --git a/src/Parsers/ASTTablesInSelectQuery.cpp b/src/Parsers/ASTTablesInSelectQuery.cpp index 0fd93bbd04d..eb3446ca1c4 100644 --- a/src/Parsers/ASTTablesInSelectQuery.cpp +++ b/src/Parsers/ASTTablesInSelectQuery.cpp @@ -210,6 +210,7 @@ void ASTTableJoin::formatImplBeforeTable(const FormatSettings & settings, Format void ASTTableJoin::formatImplAfterTable(const FormatSettings & settings, FormatState & state, FormatStateStacked frame) const { frame.need_parens = false; + frame.expression_list_prepend_whitespace = false; if (using_expression_list) { @@ -236,8 +237,10 @@ void ASTTableJoin::formatImpl(const FormatSettings & settings, FormatState & sta void ASTArrayJoin::formatImpl(const FormatSettings & settings, FormatState & state, FormatStateStacked frame) const { + frame.expression_list_prepend_whitespace = true; + settings.ostr << (settings.hilite ? hilite_keyword : "") - << (kind == Kind::Left ? "LEFT " : "") << "ARRAY JOIN " << (settings.hilite ? hilite_none : ""); + << (kind == Kind::Left ? "LEFT " : "") << "ARRAY JOIN" << (settings.hilite ? hilite_none : ""); settings.one_line ? expression_list->formatImpl(settings, state, frame) diff --git a/src/Parsers/IAST.h b/src/Parsers/IAST.h index c0c286ac0d2..cf6a7efc102 100644 --- a/src/Parsers/IAST.h +++ b/src/Parsers/IAST.h @@ -203,6 +203,7 @@ public: UInt8 indent = 0; bool need_parens = false; bool expression_list_always_start_on_new_line = false; /// Line feed and indent before expression list even if it's of single element. 
+ bool expression_list_prepend_whitespace = false; /// Prepend whitespace (if it is required) const IAST * current_select = nullptr; }; From 03247707737af0f76cacdd6b8b4544e1967f7ed9 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Tue, 8 Sep 2020 23:05:47 +0300 Subject: [PATCH 060/341] Remove all trailing whitespaces in tests sed -r -i \ -e 's/SELECT $/SELECT/' \ -e 's/SELECT DISTINCT $/SELECT DISTINCT/' \ -e 's/WITH $/WITH/' \ # zero matches, new test will be added -e 's/ARRAY JOIN $/ARRAY JOIN/' \ -e 's/GROUP BY $/GROUP BY/' \ -e 's/ORDER BY $/ORDER BY/' \ -e 's/LIMIT ([0-9]+) BY $/LIMIT \1 BY/' \ # zero matches, new test will be added tests/queries/*/*.sql \ tests/queries/*/*.reference (With except for tests/queries/0_stateless/00751_default_databasename_for_view.reference) --- .../00239_type_conversion_in_in.sql | 2 +- .../0_stateless/00250_tuple_comparison.sql | 2 +- .../00344_row_number_in_all_blocks.sql | 2 +- .../0_stateless/00436_convert_charset.sql | 4 +- .../00541_to_start_of_fifteen_minutes.sql | 4 +- .../00552_logical_functions_uint8_as_bool.sql | 2 +- ...ll_subquery_aggregation_column_removal.sql | 72 +++++----- .../00597_push_down_predicate.reference | 128 +++++++++--------- .../queries/0_stateless/00618_nullable_in.sql | 4 +- .../00712_prewhere_with_alias_bug_2.sql | 2 +- .../00740_optimize_predicate_expression.sql | 2 +- .../00743_limit_by_not_found_column.sql | 2 +- ...51_default_databasename_for_view.reference | 2 +- tests/queries/0_stateless/00759_kodieg.sql | 2 +- .../00826_cross_to_inner_join.reference | 16 +-- .../00849_multiple_comma_join.reference | 40 +++--- .../00849_multiple_comma_join_2.reference | 30 ++-- .../0_stateless/00908_analyze_query.reference | 2 +- .../0_stateless/00941_to_custom_week.sql | 2 +- ...0957_format_with_clashed_aliases.reference | 2 +- ...58_format_of_tuple_array_element.reference | 2 +- ...hecksums_in_system_parts_columns_table.sql | 2 +- .../01056_predicate_optimizer_bugs.reference | 26 ++-- ...76_predicate_optimizer_with_view.reference | 4 +- .../01083_cross_to_inner_with_like.reference | 6 +- .../0_stateless/01117_chain_finalize_bug.sql | 2 +- .../01250_fixed_string_comparison.sql | 2 +- ...ithmetic_operations_in_aggr_func.reference | 84 ++++++------ .../01272_totals_and_filter_bug.sql | 6 +- .../01278_format_multiple_queries.reference | 4 +- .../01300_group_by_other_keys.reference | 18 +-- ...01300_group_by_other_keys_having.reference | 8 +- ...egate_functions_of_group_by_keys.reference | 28 ++-- ...monotonous_functions_in_order_by.reference | 12 +- .../01322_any_input_optimize.reference | 4 +- ..._redundant_functions_in_order_by.reference | 30 ++-- .../01355_defaultValueOfArgumentType_bug.sql | 2 +- .../01372_wrong_order_by_removal.reference | 6 +- .../01379_with_fill_several_columns.sql | 8 +- .../01390_remove_injective_in_uniq.reference | 28 ++-- ...dicate_when_contains_with_clause.reference | 4 +- .../0_stateless/01418_index_analysis_bug.sql | 4 +- ..._duplicate_distinct_optimization.reference | 28 ++-- .../01470_columns_transformers.reference | 22 +-- .../1_stateful/00063_loyalty_joins.sql | 20 +-- 45 files changed, 341 insertions(+), 341 deletions(-) diff --git a/tests/queries/0_stateless/00239_type_conversion_in_in.sql b/tests/queries/0_stateless/00239_type_conversion_in_in.sql index 6e76a31ac56..5589d91ce74 100644 --- a/tests/queries/0_stateless/00239_type_conversion_in_in.sql +++ b/tests/queries/0_stateless/00239_type_conversion_in_in.sql @@ -2,7 +2,7 @@ select 1 as x, x = 1 or x = 2 or x = 3 or x = -1; select 1 as x, x = 
1.0 or x = 2 or x = 3 or x = -1; select 1 as x, x = 1.5 or x = 2 or x = 3 or x = -1; -SELECT +SELECT 1 IN (1, -1, 2.0, 2.5), 1.0 IN (1, -1, 2.0, 2.5), 1 IN (1.0, -1, 2.0, 2.5), diff --git a/tests/queries/0_stateless/00250_tuple_comparison.sql b/tests/queries/0_stateless/00250_tuple_comparison.sql index 2ee29ef5863..03a4d23a271 100644 --- a/tests/queries/0_stateless/00250_tuple_comparison.sql +++ b/tests/queries/0_stateless/00250_tuple_comparison.sql @@ -1,4 +1,4 @@ -SELECT +SELECT (1, 'Hello', 23) = (1, 'Hello', 23), (1, 'Hello', 23) != (1, 'Hello', 23), (1, 'Hello', 23) < (1, 'Hello', 23), diff --git a/tests/queries/0_stateless/00344_row_number_in_all_blocks.sql b/tests/queries/0_stateless/00344_row_number_in_all_blocks.sql index 865d0084ce8..43727f2a14e 100644 --- a/tests/queries/0_stateless/00344_row_number_in_all_blocks.sql +++ b/tests/queries/0_stateless/00344_row_number_in_all_blocks.sql @@ -1,5 +1,5 @@ SET max_block_size = 1000; -SELECT +SELECT groupUniqArray(blockSize()), uniqExact(rowNumberInAllBlocks()), min(rowNumberInAllBlocks()), diff --git a/tests/queries/0_stateless/00436_convert_charset.sql b/tests/queries/0_stateless/00436_convert_charset.sql index cba91fe67f4..1b7baf22450 100644 --- a/tests/queries/0_stateless/00436_convert_charset.sql +++ b/tests/queries/0_stateless/00436_convert_charset.sql @@ -1,4 +1,4 @@ -SELECT +SELECT 'абвгдеёжзийклмнопрстуфхцчшщъыьэюяАБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯ' AS orig, hex(convertCharset(orig, 'utf-8', 'cp1251') AS cp1251) AS cp1251_hex, hex(convertCharset(orig, 'utf-8', 'utf-7')) AS utf7_hex, @@ -13,7 +13,7 @@ SELECT convertCharset(broken3, 'utf-8', 'koi8-r') AS restored3 FORMAT Vertical; -SELECT +SELECT materialize('абвгдеёжзийклмнопрстуфхцчшщъыьэюяАБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯ') AS orig, hex(convertCharset(orig, 'utf-8', 'cp1251') AS cp1251) AS cp1251_hex, hex(convertCharset(orig, 'utf-8', 'utf-7')) AS utf7_hex, diff --git a/tests/queries/0_stateless/00541_to_start_of_fifteen_minutes.sql b/tests/queries/0_stateless/00541_to_start_of_fifteen_minutes.sql index 29056eea3d6..0c20670fad2 100644 --- a/tests/queries/0_stateless/00541_to_start_of_fifteen_minutes.sql +++ b/tests/queries/0_stateless/00541_to_start_of_fifteen_minutes.sql @@ -1,7 +1,7 @@ -SELECT +SELECT DISTINCT result FROM ( - SELECT + SELECT toStartOfFifteenMinutes(toDateTime('2017-12-25 00:00:00') + number * 60) AS result FROM system.numbers LIMIT 120 diff --git a/tests/queries/0_stateless/00552_logical_functions_uint8_as_bool.sql b/tests/queries/0_stateless/00552_logical_functions_uint8_as_bool.sql index feee33add1c..f62a02288ed 100644 --- a/tests/queries/0_stateless/00552_logical_functions_uint8_as_bool.sql +++ b/tests/queries/0_stateless/00552_logical_functions_uint8_as_bool.sql @@ -10,7 +10,7 @@ SELECT 1 OR 2 OR 4 ; -SELECT +SELECT toUInt8(bitAnd(number, 4)) AS a, toUInt8(bitAnd(number, 2)) AS b, toUInt8(bitAnd(number, 1)) AS c, diff --git a/tests/queries/0_stateless/00585_union_all_subquery_aggregation_column_removal.sql b/tests/queries/0_stateless/00585_union_all_subquery_aggregation_column_removal.sql index 47e6582134a..bf5d2251470 100644 --- a/tests/queries/0_stateless/00585_union_all_subquery_aggregation_column_removal.sql +++ b/tests/queries/0_stateless/00585_union_all_subquery_aggregation_column_removal.sql @@ -8,19 +8,19 @@ INSERT INTO clicks VALUES ('facebook.com'), ('yandex.ru'), ('google.com'); INSERT INTO transactions VALUES ('facebook.com'), ('yandex.ru'), ('baidu.com'); -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS 
total_count, toUInt64(0) AS facebookHits, domain FROM transactions GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain @@ -33,19 +33,19 @@ LIMIT 10 FORMAT JSONEachRow; -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain FROM clicks GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain @@ -60,19 +60,19 @@ FORMAT JSONEachRow; SELECT DISTINCT * FROM ( -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain FROM transactions GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain @@ -85,19 +85,19 @@ LIMIT 10 UNION ALL -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain FROM clicks GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain @@ -112,20 +112,20 @@ LIMIT 10 SELECT DISTINCT total, domain FROM ( -SELECT +SELECT sum(total_count) AS total, sum(facebookHits) AS facebook, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain FROM transactions GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain @@ -138,20 +138,20 @@ LIMIT 10 UNION ALL -SELECT +SELECT sum(total_count) AS total, max(facebookHits) AS facebook, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain FROM clicks GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain @@ -167,19 +167,19 @@ ORDER BY domain, total; SELECT * FROM ( -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain FROM transactions GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain @@ -192,19 +192,19 @@ LIMIT 10 ) js1 ALL FULL OUTER JOIN ( -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain FROM clicks GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain @@ -221,19 +221,19 @@ ORDER BY total, domain; SELECT total FROM ( -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain FROM transactions GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain @@ -246,19 +246,19 @@ LIMIT 10 ) js1 ALL FULL OUTER JOIN ( -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain FROM clicks GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain @@ -275,19 +275,19 @@ ORDER BY total, domain; SELECT domain FROM ( -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain FROM transactions GROUP BY domain 
UNION ALL - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain @@ -300,19 +300,19 @@ LIMIT 10 ) js1 ALL FULL OUTER JOIN ( -SELECT +SELECT sum(total_count) AS total, domain FROM ( - SELECT + SELECT COUNT(*) AS total_count, SUM(if(domain = 'facebook.com', 1, 0)) AS facebookHits, domain FROM clicks GROUP BY domain UNION ALL - SELECT + SELECT COUNT(*) AS total_count, toUInt64(0) AS facebookHits, domain diff --git a/tests/queries/0_stateless/00597_push_down_predicate.reference b/tests/queries/0_stateless/00597_push_down_predicate.reference index 1798c727088..83f783138a0 100644 --- a/tests/queries/0_stateless/00597_push_down_predicate.reference +++ b/tests/queries/0_stateless/00597_push_down_predicate.reference @@ -7,18 +7,18 @@ SELECT count() FROM ( - SELECT + SELECT [number] AS a, [number * 2] AS b FROM system.numbers LIMIT 1 ) AS t -ARRAY JOIN +ARRAY JOIN a, b WHERE NOT ignore(a + b) 1 -SELECT +SELECT a, b FROM @@ -27,17 +27,17 @@ FROM ) ANY LEFT JOIN ( - SELECT + SELECT 1 AS a, 1 AS b ) USING (a) WHERE b = 0 -SELECT +SELECT a, b FROM ( - SELECT + SELECT 1 AS a, 1 AS b ) @@ -46,7 +46,7 @@ ANY RIGHT JOIN SELECT 1 AS a ) USING (a) WHERE b = 0 -SELECT +SELECT a, b FROM @@ -55,17 +55,17 @@ FROM ) ANY FULL OUTER JOIN ( - SELECT + SELECT 1 AS a, 1 AS b ) USING (a) WHERE b = 0 -SELECT +SELECT a, b FROM ( - SELECT + SELECT 1 AS a, 1 AS b ) @@ -107,22 +107,22 @@ FROM ) WHERE id = 1 1 -SELECT +SELECT id, subquery FROM ( - SELECT + SELECT 1 AS id, CAST(1, \'UInt8\') AS subquery ) 1 1 -SELECT +SELECT a, b FROM ( - SELECT + SELECT toUInt64(sum(id) AS b) AS a, b FROM test_00597 @@ -130,20 +130,20 @@ FROM ) WHERE a = 3 3 3 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, name, value, min(id) AS id FROM test_00597 - GROUP BY + GROUP BY date, name, value @@ -151,12 +151,12 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT a, b FROM ( - SELECT + SELECT toUInt64(sum(id) AS b) AS a, b FROM test_00597 AS table_alias @@ -164,14 +164,14 @@ FROM ) AS outer_table_alias WHERE b = 3 3 3 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -181,21 +181,21 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -207,21 +207,21 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -233,14 +233,14 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -250,21 +250,21 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -276,14 +276,14 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -293,21 +293,21 @@ FROM ) AS b WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -319,32 +319,32 @@ FROM ) AS b WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT id, date, value FROM ( - SELECT + SELECT id, date, min(value) AS value FROM test_00597 WHERE id = 1 - GROUP BY + GROUP BY id, date ) WHERE id = 1 1 2000-01-01 1 -SELECT +SELECT date, id, name, value FROM ( - 
SELECT + SELECT date, id, name, @@ -352,7 +352,7 @@ FROM FROM test_00597 WHERE id = 1 UNION ALL - SELECT + SELECT date, id, name, @@ -363,7 +363,7 @@ FROM WHERE id = 1 2000-01-01 1 test string 1 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, @@ -373,7 +373,7 @@ SELECT value FROM ( - SELECT + SELECT date, id, name, @@ -388,7 +388,7 @@ ANY LEFT JOIN ) USING (id) WHERE id = 1 2000-01-01 1 test string 1 1 2000-01-01 test string 1 1 -SELECT +SELECT id, date, name, @@ -399,7 +399,7 @@ FROM ) ANY LEFT JOIN ( - SELECT + SELECT date, id, name, @@ -416,14 +416,14 @@ FROM ANY LEFT JOIN test_00597 AS b USING (id) WHERE value = 1 1 -SELECT +SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, @@ -433,7 +433,7 @@ FROM value FROM ( - SELECT + SELECT date, id, name, @@ -450,7 +450,7 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, @@ -460,7 +460,7 @@ SELECT b.value FROM ( - SELECT + SELECT date, id, name, @@ -469,7 +469,7 @@ FROM ) ANY LEFT JOIN ( - SELECT + SELECT date, id, name, @@ -478,14 +478,14 @@ ANY LEFT JOIN ) AS b USING (id) WHERE b.id = 1 2000-01-01 1 test string 1 1 2000-01-01 test string 1 1 -SELECT +SELECT id, date, name, value FROM ( - SELECT + SELECT toInt8(1) AS id, toDate(\'2000-01-01\') AS date FROM system.numbers @@ -493,7 +493,7 @@ FROM ) ANY LEFT JOIN ( - SELECT + SELECT date, id, name, @@ -502,7 +502,7 @@ ANY LEFT JOIN ) AS b USING (date, id) WHERE b.date = toDate(\'2000-01-01\') 1 2000-01-01 test string 1 1 -SELECT +SELECT date, id, name, @@ -513,7 +513,7 @@ SELECT `b.value` FROM ( - SELECT + SELECT date, id, name, @@ -524,7 +524,7 @@ FROM b.value FROM ( - SELECT + SELECT date, id, name, @@ -534,7 +534,7 @@ FROM ) AS a ANY LEFT JOIN ( - SELECT + SELECT date, id, name, @@ -545,7 +545,7 @@ FROM ) WHERE id = 1 2000-01-01 1 test string 1 1 2000-01-01 1 test string 1 1 -SELECT +SELECT date, id, name, @@ -555,7 +555,7 @@ SELECT r.value FROM ( - SELECT + SELECT date, id, name, @@ -564,14 +564,14 @@ FROM ) SEMI LEFT JOIN ( - SELECT + SELECT date, id, name, value FROM ( - SELECT + SELECT date, id, name, diff --git a/tests/queries/0_stateless/00618_nullable_in.sql b/tests/queries/0_stateless/00618_nullable_in.sql index 8e8c26d225d..72e166dc0f5 100644 --- a/tests/queries/0_stateless/00618_nullable_in.sql +++ b/tests/queries/0_stateless/00618_nullable_in.sql @@ -1,13 +1,13 @@ SELECT sum(toNullable('a') IN 'a'); SELECT countIf(number, toNullable('a') IN ('a', 'b')) FROM numbers(100); -SELECT +SELECT uniqExact(x) AS u, uniqExactIf(x, name = 'a') AS ue, uniqExactIf(x, name IN ('a', 'b')) AS ui FROM ( - SELECT + SELECT toNullable('a') AS name, arrayJoin(range(10)) AS x ) diff --git a/tests/queries/0_stateless/00712_prewhere_with_alias_bug_2.sql b/tests/queries/0_stateless/00712_prewhere_with_alias_bug_2.sql index 2c5c494fc1f..97d5e33633a 100644 --- a/tests/queries/0_stateless/00712_prewhere_with_alias_bug_2.sql +++ b/tests/queries/0_stateless/00712_prewhere_with_alias_bug_2.sql @@ -4,7 +4,7 @@ CREATE TABLE table (a UInt32, date Date, b UInt64, c UInt64, str String, d Int SELECT alias2 AS alias3 FROM table -ARRAY JOIN +ARRAY JOIN arr_alias AS alias2, arrayEnumerateUniq(arr_alias) AS _uniq_Event WHERE (date = toDate('2010-10-10')) AND (a IN (2, 3)) AND (str NOT IN ('z', 'x')) AND (d != -1) diff --git a/tests/queries/0_stateless/00740_optimize_predicate_expression.sql b/tests/queries/0_stateless/00740_optimize_predicate_expression.sql index b016ab49ddd..65b06635808 100644 --- 
a/tests/queries/0_stateless/00740_optimize_predicate_expression.sql +++ b/tests/queries/0_stateless/00740_optimize_predicate_expression.sql @@ -5,7 +5,7 @@ SELECT * FROM (SELECT perf_1.z AS z_1 FROM perf AS perf_1); SELECT sum(mul)/sqrt(sum(sqr_dif_1) * sum(sqr_dif_2)) AS z_r FROM( -SELECT +SELECT (SELECT avg(z_1) AS z_1_avg, avg(z_2) AS z_2_avg FROM ( diff --git a/tests/queries/0_stateless/00743_limit_by_not_found_column.sql b/tests/queries/0_stateless/00743_limit_by_not_found_column.sql index 46c6bcb99b2..d20b3b0209e 100644 --- a/tests/queries/0_stateless/00743_limit_by_not_found_column.sql +++ b/tests/queries/0_stateless/00743_limit_by_not_found_column.sql @@ -24,7 +24,7 @@ CREATE TEMPORARY TABLE Accounts (AccountID UInt64, Currency String); SELECT AccountID FROM ( - SELECT + SELECT AccountID, Currency FROM Accounts diff --git a/tests/queries/0_stateless/00751_default_databasename_for_view.reference b/tests/queries/0_stateless/00751_default_databasename_for_view.reference index 4814cc77b37..76d5cee02e2 100644 --- a/tests/queries/0_stateless/00751_default_databasename_for_view.reference +++ b/tests/queries/0_stateless/00751_default_databasename_for_view.reference @@ -7,7 +7,7 @@ CREATE MATERIALIZED VIEW test_00751.t_mv_00751 ENGINE = MergeTree ORDER BY date SETTINGS index_granularity = 8192 AS -SELECT +SELECT date, platform, app diff --git a/tests/queries/0_stateless/00759_kodieg.sql b/tests/queries/0_stateless/00759_kodieg.sql index 2037f210dea..9cbe2a0cd7f 100644 --- a/tests/queries/0_stateless/00759_kodieg.sql +++ b/tests/queries/0_stateless/00759_kodieg.sql @@ -1,4 +1,4 @@ -SELECT +SELECT [1, 2, 3, 1, 3] AS a, indexOf(arrayReverse(arraySlice(a, 1, -1)), 3) AS offset_from_right, arraySlice(a, multiIf(offset_from_right = 0, 1, (length(a) - offset_from_right) + 1)); diff --git a/tests/queries/0_stateless/00826_cross_to_inner_join.reference b/tests/queries/0_stateless/00826_cross_to_inner_join.reference index 6e5cbdcab4e..e7c8d6b1ea9 100644 --- a/tests/queries/0_stateless/00826_cross_to_inner_join.reference +++ b/tests/queries/0_stateless/00826_cross_to_inner_join.reference @@ -35,7 +35,7 @@ comma nullable 1 1 1 1 2 2 1 2 cross -SELECT +SELECT a, b, t2_00826.a, @@ -44,7 +44,7 @@ FROM t1_00826 ALL INNER JOIN t2_00826 ON a = t2_00826.a WHERE a = t2_00826.a cross nullable -SELECT +SELECT a, b, t2_00826.a, @@ -53,7 +53,7 @@ FROM t1_00826 ALL INNER JOIN t2_00826 ON a = t2_00826.a WHERE a = t2_00826.a cross nullable vs not nullable -SELECT +SELECT a, b, t2_00826.a, @@ -62,7 +62,7 @@ FROM t1_00826 ALL INNER JOIN t2_00826 ON a = t2_00826.b WHERE a = t2_00826.b cross self -SELECT +SELECT a, b, y.a, @@ -71,7 +71,7 @@ FROM t1_00826 AS x ALL INNER JOIN t1_00826 AS y ON (a = y.a) AND (b = y.b) WHERE (a = y.a) AND (b = y.b) cross one table expr -SELECT +SELECT a, b, t2_00826.a, @@ -80,7 +80,7 @@ FROM t1_00826 CROSS JOIN t2_00826 WHERE a = b cross multiple ands -SELECT +SELECT a, b, t2_00826.a, @@ -89,7 +89,7 @@ FROM t1_00826 ALL INNER JOIN t2_00826 ON (a = t2_00826.a) AND (b = t2_00826.b) WHERE (a = t2_00826.a) AND (b = t2_00826.b) cross and inside and -SELECT +SELECT a, b, t2_00826.a, @@ -98,7 +98,7 @@ FROM t1_00826 ALL INNER JOIN t2_00826 ON (a = t2_00826.a) AND (a = t2_00826.a) AND (a = t2_00826.a) AND (b = t2_00826.b) WHERE (a = t2_00826.a) AND ((a = t2_00826.a) AND ((a = t2_00826.a) AND (b = t2_00826.b))) cross split conjunction -SELECT +SELECT a, b, t2_00826.a, diff --git a/tests/queries/0_stateless/00849_multiple_comma_join.reference 
b/tests/queries/0_stateless/00849_multiple_comma_join.reference index 5a5a90cbdf2..f4db2238dd1 100644 --- a/tests/queries/0_stateless/00849_multiple_comma_join.reference +++ b/tests/queries/0_stateless/00849_multiple_comma_join.reference @@ -12,7 +12,7 @@ WHERE b = t2_00849.b SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a AS `--t2_00849.a`, @@ -25,7 +25,7 @@ WHERE (`--t1_00849.a` = `--t2_00849.a`) AND (`--t1_00849.a` = a) SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b AS `--t1_00849.b`, t2_00849.a, @@ -38,7 +38,7 @@ WHERE (`--t1_00849.b` = `--t2_00849.b`) AND (`--t1_00849.b` = b) SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, b, `--t2_00849.a`, @@ -47,7 +47,7 @@ FROM t3_00849.b FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a AS `--t2_00849.a`, @@ -62,7 +62,7 @@ WHERE (`--t1_00849.a` = `--t2_00849.a`) AND (`--t1_00849.a` = `--t3_00849.a`) AN SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, `--t1_00849.b`, `t2_00849.a`, @@ -71,7 +71,7 @@ FROM b AS `--t3_00849.b` FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b AS `--t1_00849.b`, t2_00849.a, @@ -86,7 +86,7 @@ WHERE (`--t1_00849.b` = `--t2_00849.b`) AND (`--t1_00849.b` = `--t3_00849.b`) AN SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, b, `--t2_00849.a`, @@ -95,7 +95,7 @@ FROM t3_00849.b FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a AS `--t2_00849.a`, @@ -110,7 +110,7 @@ WHERE (`--t2_00849.a` = `--t1_00849.a`) AND (`--t2_00849.a` = `--t3_00849.a`) AN SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, b, `--t2_00849.a`, @@ -119,7 +119,7 @@ FROM t3_00849.b FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a AS `--t2_00849.a`, @@ -134,7 +134,7 @@ WHERE (`--t3_00849.a` = `--t1_00849.a`) AND (`--t3_00849.a` = `--t2_00849.a`) AN SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, b, `--t2_00849.a`, @@ -143,7 +143,7 @@ FROM t3_00849.b FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a AS `--t2_00849.a`, @@ -158,7 +158,7 @@ WHERE (a = `--t1_00849.a`) AND (a = `--t2_00849.a`) AND (a = `--t3_00849.a`) SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, b, `--t2_00849.a`, @@ -167,7 +167,7 @@ FROM t3_00849.b FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a AS `--t2_00849.a`, @@ -182,7 +182,7 @@ WHERE (`--t1_00849.a` = `--t2_00849.a`) AND (`--t2_00849.a` = `--t3_00849.a`) AN SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, b, `t2_00849.a`, @@ -191,7 +191,7 @@ FROM t3_00849.b FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a, @@ -205,7 +205,7 @@ CROSS JOIN t4_00849 SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT `--t1_00849.a`, b, `t2_00849.a`, @@ -214,7 +214,7 @@ FROM t3_00849.b FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a, @@ -228,7 +228,7 @@ CROSS JOIN t4_00849 SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a, @@ -240,7 +240,7 @@ CROSS JOIN t3_00849 SELECT `--t1_00849.a` AS `t1_00849.a` FROM ( - SELECT + SELECT a AS `--t1_00849.a`, b, t2_00849.a AS `--t2_00849.a`, diff --git a/tests/queries/0_stateless/00849_multiple_comma_join_2.reference b/tests/queries/0_stateless/00849_multiple_comma_join_2.reference index e08d6ff1192..fc39ef13935 100644 --- a/tests/queries/0_stateless/00849_multiple_comma_join_2.reference +++ 
b/tests/queries/0_stateless/00849_multiple_comma_join_2.reference @@ -12,7 +12,7 @@ WHERE b = t2.b SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT a AS `--t1.a`, t2.a AS `--t2.a` FROM t1 @@ -23,7 +23,7 @@ WHERE (`--t1.a` = `--t2.a`) AND (`--t1.a` = a) SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT b AS `--t1.b`, a AS `--t1.a`, t2.b AS `--t2.b` @@ -35,13 +35,13 @@ WHERE (`--t1.b` = `--t2.b`) AND (`--t1.b` = b) SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT `--t1.a`, `--t2.a`, a AS `--t3.a` FROM ( - SELECT + SELECT a AS `--t1.a`, t2.a AS `--t2.a` FROM t1 @@ -54,14 +54,14 @@ WHERE (`--t1.a` = `--t2.a`) AND (`--t1.a` = `--t3.a`) AND (`--t1.a` = a) SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT `--t1.b`, `--t1.a`, `--t2.b`, b AS `--t3.b` FROM ( - SELECT + SELECT b AS `--t1.b`, a AS `--t1.a`, t2.b AS `--t2.b` @@ -75,13 +75,13 @@ WHERE (`--t1.b` = `--t2.b`) AND (`--t1.b` = `--t3.b`) AND (`--t1.b` = b) SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT `--t1.a`, `--t2.a`, a AS `--t3.a` FROM ( - SELECT + SELECT a AS `--t1.a`, t2.a AS `--t2.a` FROM t1 @@ -94,13 +94,13 @@ WHERE (`--t2.a` = `--t1.a`) AND (`--t2.a` = `--t3.a`) AND (`--t2.a` = a) SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT `--t1.a`, `--t2.a`, a AS `--t3.a` FROM ( - SELECT + SELECT a AS `--t1.a`, t2.a AS `--t2.a` FROM t1 @@ -113,13 +113,13 @@ WHERE (`--t3.a` = `--t1.a`) AND (`--t3.a` = `--t2.a`) AND (`--t3.a` = a) SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT `--t1.a`, `--t2.a`, a AS `--t3.a` FROM ( - SELECT + SELECT a AS `--t1.a`, t2.a AS `--t2.a` FROM t1 @@ -132,13 +132,13 @@ WHERE (a = `--t1.a`) AND (a = `--t2.a`) AND (a = `--t3.a`) SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT `--t1.a`, `--t2.a`, a AS `--t3.a` FROM ( - SELECT + SELECT a AS `--t1.a`, t2.a AS `--t2.a` FROM t1 @@ -185,7 +185,7 @@ CROSS JOIN t3 SELECT `--t1.a` AS `t1.a` FROM ( - SELECT + SELECT a AS `--t1.a`, t2.a AS `--t2.a` FROM t1 diff --git a/tests/queries/0_stateless/00908_analyze_query.reference b/tests/queries/0_stateless/00908_analyze_query.reference index 0305f528b25..ab9237531f7 100644 --- a/tests/queries/0_stateless/00908_analyze_query.reference +++ b/tests/queries/0_stateless/00908_analyze_query.reference @@ -1,4 +1,4 @@ -SELECT +SELECT a, b FROM a diff --git a/tests/queries/0_stateless/00941_to_custom_week.sql b/tests/queries/0_stateless/00941_to_custom_week.sql index a6ff40a6d3f..c7d52e7438b 100644 --- a/tests/queries/0_stateless/00941_to_custom_week.sql +++ b/tests/queries/0_stateless/00941_to_custom_week.sql @@ -25,7 +25,7 @@ SELECT toWeek(toDate('2001-01-01'),0) AS w0, toWeek(toDate('2001-01-01'),1) AS w SELECT toYearWeek(toDate('2000-12-31'),0), toYearWeek(toDate('2000-12-31'),1), toYearWeek(toDate('2000-12-31'),2), toYearWeek(toDate('2000-12-31'),3), toYearWeek(toDate('2000-12-31'),4), toYearWeek(toDate('2000-12-31'),5), toYearWeek(toDate('2000-12-31'),6), toYearWeek(toDate('2000-12-31'),7); -- week mode 8,9 -SELECT +SELECT toDate('2016-12-21') + number AS d, toWeek(d, 8) AS week8, toWeek(d, 9) AS week9, diff --git a/tests/queries/0_stateless/00957_format_with_clashed_aliases.reference b/tests/queries/0_stateless/00957_format_with_clashed_aliases.reference index d1c8033b363..d6e53c8b48b 100644 --- a/tests/queries/0_stateless/00957_format_with_clashed_aliases.reference +++ b/tests/queries/0_stateless/00957_format_with_clashed_aliases.reference @@ -1,4 +1,4 @@ -SELECT +SELECT 1 AS x, x.y FROM diff --git a/tests/queries/0_stateless/00958_format_of_tuple_array_element.reference 
b/tests/queries/0_stateless/00958_format_of_tuple_array_element.reference index eaea02ba40b..a2953fa0264 100644 --- a/tests/queries/0_stateless/00958_format_of_tuple_array_element.reference +++ b/tests/queries/0_stateless/00958_format_of_tuple_array_element.reference @@ -1,4 +1,4 @@ -SELECT +SELECT (x.1)[1], (((x[1]).1)[1]).1, (NOT x)[1], diff --git a/tests/queries/0_stateless/00961_checksums_in_system_parts_columns_table.sql b/tests/queries/0_stateless/00961_checksums_in_system_parts_columns_table.sql index b9eed1e8183..3b99ebf8b22 100644 --- a/tests/queries/0_stateless/00961_checksums_in_system_parts_columns_table.sql +++ b/tests/queries/0_stateless/00961_checksums_in_system_parts_columns_table.sql @@ -4,7 +4,7 @@ CREATE TABLE test_00961 (d Date, a String, b UInt8, x String, y Int8, z UInt32) INSERT INTO test_00961 VALUES ('2000-01-01', 'Hello, world!', 123, 'xxx yyy', -123, 123456789); -SELECT +SELECT name, table, hash_of_all_files, diff --git a/tests/queries/0_stateless/01056_predicate_optimizer_bugs.reference b/tests/queries/0_stateless/01056_predicate_optimizer_bugs.reference index fd9d96bdf5f..4227af86be7 100644 --- a/tests/queries/0_stateless/01056_predicate_optimizer_bugs.reference +++ b/tests/queries/0_stateless/01056_predicate_optimizer_bugs.reference @@ -1,11 +1,11 @@ -SELECT +SELECT k, v, d, i FROM ( - SELECT + SELECT t.1 AS k, t.2 AS v, runningDifference(v) AS d, @@ -21,26 +21,26 @@ a 2 1 0 a 3 1 0 b 13 2 0 b 15 2 0 -SELECT +SELECT co, co2, co3, num FROM ( - SELECT + SELECT co, co2, co3, count() AS num FROM ( - SELECT + SELECT 1 AS co, 2 AS co2, 3 AS co3 ) - GROUP BY + GROUP BY co, co2, co3 @@ -84,7 +84,7 @@ FROM ) WHERE ccc > 1 2 -SELECT +SELECT ts, id, id_b, @@ -93,7 +93,7 @@ SELECT id_c FROM ( - SELECT + SELECT ts, id, id_b @@ -102,7 +102,7 @@ FROM ) AS a ALL LEFT JOIN B AS b ON b.id = id_b WHERE ts <= toDateTime(\'1970-01-01 03:00:00\') -SELECT +SELECT ts AS `--a.ts`, id AS `--a.id`, id_b AS `--a.id_b`, @@ -111,7 +111,7 @@ SELECT id_c AS `--b.id_c` FROM ( - SELECT + SELECT ts, id, id_b @@ -137,19 +137,19 @@ FROM ) WHERE arrayMap(x -> (x + 1), [dummy]) = [1] 0 -SELECT +SELECT id, value, value_1 FROM ( - SELECT + SELECT 1 AS id, 2 AS value ) ALL INNER JOIN ( - SELECT + SELECT 1 AS id, 3 AS value_1 ) USING (id) diff --git a/tests/queries/0_stateless/01076_predicate_optimizer_with_view.reference b/tests/queries/0_stateless/01076_predicate_optimizer_with_view.reference index d6426f679c5..dfab41b5e4c 100644 --- a/tests/queries/0_stateless/01076_predicate_optimizer_with_view.reference +++ b/tests/queries/0_stateless/01076_predicate_optimizer_with_view.reference @@ -1,4 +1,4 @@ -SELECT +SELECT date, id, name, @@ -10,7 +10,7 @@ FROM HAVING id = 1 ) AS test_view WHERE id = 1 -SELECT +SELECT date, id, name, diff --git a/tests/queries/0_stateless/01083_cross_to_inner_with_like.reference b/tests/queries/0_stateless/01083_cross_to_inner_with_like.reference index 5491e82c7d3..42bbeb05ecb 100644 --- a/tests/queries/0_stateless/01083_cross_to_inner_with_like.reference +++ b/tests/queries/0_stateless/01083_cross_to_inner_with_like.reference @@ -1,18 +1,18 @@ -SELECT +SELECT k, r.k, name FROM n ALL INNER JOIN r ON k = r.k WHERE (k = r.k) AND (name = \'A\') -SELECT +SELECT k, r.k, name FROM n ALL INNER JOIN r ON k = r.k WHERE (k = r.k) AND (name LIKE \'A%\') -SELECT +SELECT k, r.k, name diff --git a/tests/queries/0_stateless/01117_chain_finalize_bug.sql b/tests/queries/0_stateless/01117_chain_finalize_bug.sql index f79f82b8d4d..273b742d0bd 100644 --- 
a/tests/queries/0_stateless/01117_chain_finalize_bug.sql +++ b/tests/queries/0_stateless/01117_chain_finalize_bug.sql @@ -14,7 +14,7 @@ SET group_by_two_level_threshold = 2; SELECT count() FROM ( - SELECT + SELECT arrayJoin(arrayMap(i -> (i + 1), range(2))) AS index, number FROM numbers_mt(100000) diff --git a/tests/queries/0_stateless/01250_fixed_string_comparison.sql b/tests/queries/0_stateless/01250_fixed_string_comparison.sql index 8481b3572bb..d574fd082f0 100644 --- a/tests/queries/0_stateless/01250_fixed_string_comparison.sql +++ b/tests/queries/0_stateless/01250_fixed_string_comparison.sql @@ -1,5 +1,5 @@ WITH 'abb' AS b, 'abc' AS c, 'abd' AS d, toFixedString(b, 5) AS bf, toFixedString(c, 5) AS cf, toFixedString(d, 5) AS df -SELECT +SELECT b = b, b > b, b < b, b = c, b > c, b < c, b = d, b > d, b < d, diff --git a/tests/queries/0_stateless/01271_optimize_arithmetic_operations_in_aggr_func.reference b/tests/queries/0_stateless/01271_optimize_arithmetic_operations_in_aggr_func.reference index eeba2646046..669221005f4 100644 --- a/tests/queries/0_stateless/01271_optimize_arithmetic_operations_in_aggr_func.reference +++ b/tests/queries/0_stateless/01271_optimize_arithmetic_operations_in_aggr_func.reference @@ -1,4 +1,4 @@ -SELECT +SELECT sum(n + 1), sum(1 + n), sum(n - 1), @@ -8,7 +8,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(n) * 2, 2 * sum(n), sum(n) / 2, @@ -18,7 +18,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(n) + 1, 1 + min(n), min(n) - 1, @@ -28,7 +28,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(n) * 2, 2 * min(n), min(n) / 2, @@ -38,7 +38,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(n) + 1, 1 + max(n), max(n) - 1, @@ -48,7 +48,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(n) * 2, 2 * max(n), max(n) / 2, @@ -58,7 +58,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(n + -1), sum(-1 + n), sum(n - -1), @@ -68,7 +68,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(n) * -2, -2 * sum(n), sum(n) / -2, @@ -78,7 +78,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(n) + -1, -1 + min(n), min(n) - -1, @@ -88,7 +88,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(n) * -2, -2 * max(n), max(n) / -2, @@ -98,7 +98,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(n) + -1, -1 + max(n), max(n) - -1, @@ -108,7 +108,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(n) * -2, -2 * min(n), min(n) / -2, @@ -118,7 +118,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(abs(2) + 1), sum(abs(2) + n), sum(n - abs(2)), @@ -128,7 +128,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(abs(2)) * 2, sum(abs(2) * n), sum(n / abs(2)), @@ -138,7 +138,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(abs(2)) + 1, min(abs(2) + n), min(n - abs(2)), @@ -148,7 +148,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(abs(2)) * 2, min(abs(2) * n), min(n / abs(2)), @@ -158,7 +158,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(abs(2)) + 1, max(abs(2) + n), max(n - abs(2)), @@ -168,7 +168,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(abs(2)) * 2, max(abs(2) * n), max(n / abs(2)), @@ -178,7 +178,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(abs(n) + 1), sum(abs(n) + n), sum(n - abs(n)), @@ -188,7 +188,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT 
sum(abs(n)) * 2, sum(abs(n) * n), sum(n / abs(n)), @@ -198,7 +198,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(abs(n)) + 1, min(abs(n) + n), min(n - abs(n)), @@ -208,7 +208,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(abs(n)) * 2, min(abs(n) * n), min(n / abs(n)), @@ -218,7 +218,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(abs(n)) + 1, max(abs(n) + n), max(n - abs(n)), @@ -228,7 +228,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(abs(n)) * 2, max(abs(n) * n), max(n / abs(n)), @@ -238,7 +238,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum((n * n) + 1), sum(1 + (n * n)), sum((n * n) - 1), @@ -248,7 +248,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(n * n) * 2, sum((2 * n) * n), sum(n * n) / 2, @@ -258,7 +258,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(n * n) + 1, 1 + min(n * n), min(n * n) - 1, @@ -268,7 +268,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT min(n * n) * 2, min((2 * n) * n), min(n * n) / 2, @@ -278,7 +278,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(n * n) + 1, 1 + max(n * n), max(n * n) - 1, @@ -288,7 +288,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT max(n * n) * 2, max((2 * n) * n), max(n * n) / 2, @@ -298,7 +298,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum((1 + n) + 1), sum((1 + 1) + n), sum((1 + n) - 1), @@ -308,7 +308,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum(1 + (n * 2)), sum(1 + (2 * n)), sum(1 + (n / 2)), @@ -318,7 +318,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT (1 + min(n)) + 1, min((1 + 1) + n), (1 + min(n)) - 1, @@ -328,7 +328,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT 1 + min(n * 2), 1 + min(2 * n), 1 + min(n / 2), @@ -338,7 +338,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT (1 + max(n)) + 1, max((1 + 1) + n), (1 + max(n)) - 1, @@ -348,7 +348,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT 1 + max(n * 2), 1 + max(2 * n), 1 + max(n / 2), @@ -358,7 +358,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT sum((n + -1) + -1), sum((-1 + n) + -1), sum((n - -1) + -1), @@ -368,7 +368,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT (sum(n) * -2) * -1, (-2 * sum(n)) * -1, (sum(n) / -2) / -1, @@ -378,7 +378,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT (min(n) + -1) + -1, (-1 + min(n)) + -1, (min(n) - -1) + -1, @@ -388,7 +388,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT (min(n) * -2) * -1, (-2 * min(n)) * -1, (min(n) / -2) / -1, @@ -398,7 +398,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT (max(n) + -1) + -1, (-1 + max(n)) + -1, (max(n) - -1) + -1, @@ -408,7 +408,7 @@ FROM SELECT number AS n FROM numbers(10) ) -SELECT +SELECT (max(n) * -2) * -1, (-2 * max(n)) * -1, (max(n) / -2) / -1, diff --git a/tests/queries/0_stateless/01272_totals_and_filter_bug.sql b/tests/queries/0_stateless/01272_totals_and_filter_bug.sql index a6082ae9f11..de751eb73bd 100644 --- a/tests/queries/0_stateless/01272_totals_and_filter_bug.sql +++ b/tests/queries/0_stateless/01272_totals_and_filter_bug.sql @@ -8,13 +8,13 @@ CREATE TABLE bar (server_date Date, dimension_1 String, metric_2 UInt32) ENGINE INSERT INTO foo VALUES ('2020-01-01', 'test1', 10), ('2020-01-01', 'test2', 20); INSERT INTO bar VALUES ('2020-01-01', 'test2', 30), ('2020-01-01', 'test3', 40); -SELECT +SELECT dimension_1, 
sum_metric_1, sum_metric_2 FROM ( - SELECT + SELECT dimension_1, sum(metric_1) AS sum_metric_1 FROM foo @@ -23,7 +23,7 @@ FROM ) AS subquery_1 ALL FULL OUTER JOIN ( - SELECT + SELECT dimension_1, sum(metric_2) AS sum_metric_2 FROM bar diff --git a/tests/queries/0_stateless/01278_format_multiple_queries.reference b/tests/queries/0_stateless/01278_format_multiple_queries.reference index b12e3b30f0c..001b10b0990 100644 --- a/tests/queries/0_stateless/01278_format_multiple_queries.reference +++ b/tests/queries/0_stateless/01278_format_multiple_queries.reference @@ -1,4 +1,4 @@ -SELECT +SELECT a, b AS x FROM table AS t @@ -6,7 +6,7 @@ INNER JOIN table2 AS t2 ON t.id = t2.t_id WHERE 1 = 1 ; -SELECT +SELECT a, b AS x, if(x = 0, a, b) diff --git a/tests/queries/0_stateless/01300_group_by_other_keys.reference b/tests/queries/0_stateless/01300_group_by_other_keys.reference index bd2372dca93..1db34d884a3 100644 --- a/tests/queries/0_stateless/01300_group_by_other_keys.reference +++ b/tests/queries/0_stateless/01300_group_by_other_keys.reference @@ -24,7 +24,7 @@ 3465735.9028 SELECT max(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY number % 2, number % 3, ((number % 2) + (number % 3)) % 2 @@ -35,19 +35,19 @@ GROUP BY number % 5 ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY (number % 2) * (number % 3), number % 3 ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY number % 3, number % 2 ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY (number % 2) % 3, number % 2 ORDER BY k ASC @@ -77,33 +77,33 @@ ORDER BY k ASC 3465735.9028 SELECT max(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY number % 2, number % 3, ((number % 2) + (number % 3)) % 2 ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY number % 5, (number % 5) * (number % 5) ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY (number % 2) * (number % 3), number % 3 ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY (number % 2) * (number % 3), number % 3, number % 2 ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY (number % 2) % 3, number % 2 ORDER BY k ASC diff --git a/tests/queries/0_stateless/01300_group_by_other_keys_having.reference b/tests/queries/0_stateless/01300_group_by_other_keys_having.reference index 0bec0ebdf9b..a470c19a244 100644 --- a/tests/queries/0_stateless/01300_group_by_other_keys_having.reference +++ b/tests/queries/0_stateless/01300_group_by_other_keys_having.reference @@ -9,7 +9,7 @@ 4 SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY number % 3, number % 2 HAVING avg(log(2) * number) > 3465735.3 @@ -35,7 +35,7 @@ ORDER BY k ASC 4 SELECT avg(log(2) * number) AS k FROM numbers(10000000) -GROUP BY +GROUP BY (number % 2) * (number % 3), number % 3, number % 2 @@ -44,14 +44,14 @@ ORDER BY k ASC SELECT avg(log(2) * number) AS k FROM numbers(10000000) WHERE ((number % 5) * (number % 5)) < 5 -GROUP BY +GROUP BY number % 5, (number % 5) * (number % 5) ORDER BY k ASC SELECT (number % 5) * (number % 5) AS k FROM numbers(10000000) WHERE ((number % 5) * (number % 5)) < 5 -GROUP BY +GROUP BY number % 5, (number % 5) * (number % 5) ORDER BY k ASC diff --git a/tests/queries/0_stateless/01321_aggregate_functions_of_group_by_keys.reference 
b/tests/queries/0_stateless/01321_aggregate_functions_of_group_by_keys.reference index 875a6753f84..92d6e5c37e6 100644 --- a/tests/queries/0_stateless/01321_aggregate_functions_of_group_by_keys.reference +++ b/tests/queries/0_stateless/01321_aggregate_functions_of_group_by_keys.reference @@ -47,29 +47,29 @@ 24 0 0 -SELECT +SELECT number % 2 AS a, number % 3 AS b FROM numbers(10000000) -GROUP BY +GROUP BY number % 2, number % 3 -ORDER BY +ORDER BY min(number % 2) AS a ASC, max(number % 3) AS b ASC -SELECT +SELECT number % 2 AS a, number % 3 AS b FROM numbers(10000000) -GROUP BY +GROUP BY number % 2, number % 3 -ORDER BY +ORDER BY any(number % 2) AS a ASC, anyLast(number % 3) AS b ASC SELECT (number % 5) * (number % 7) AS a FROM numbers(10000000) -GROUP BY +GROUP BY number % 7, number % 5 ORDER BY max((number % 5) * (number % 7)) AS a ASC @@ -128,29 +128,29 @@ FROM 20 24 0 -SELECT +SELECT min(number % 2) AS a, max(number % 3) AS b FROM numbers(10000000) -GROUP BY +GROUP BY number % 2, number % 3 -ORDER BY +ORDER BY a ASC, b ASC -SELECT +SELECT any(number % 2) AS a, anyLast(number % 3) AS b FROM numbers(10000000) -GROUP BY +GROUP BY number % 2, number % 3 -ORDER BY +ORDER BY a ASC, b ASC SELECT max((number % 5) * (number % 7)) AS a FROM numbers(10000000) -GROUP BY +GROUP BY number % 7, number % 5 ORDER BY a ASC diff --git a/tests/queries/0_stateless/01321_monotonous_functions_in_order_by.reference b/tests/queries/0_stateless/01321_monotonous_functions_in_order_by.reference index e8e7d754ed9..ffa91586f35 100644 --- a/tests/queries/0_stateless/01321_monotonous_functions_in_order_by.reference +++ b/tests/queries/0_stateless/01321_monotonous_functions_in_order_by.reference @@ -54,12 +54,12 @@ FROM numbers(3) ORDER BY exp(number) ASC SELECT roundToExp2(number) AS x FROM numbers(3) -ORDER BY +ORDER BY number ASC, number ASC SELECT number AS x FROM numbers(3) -ORDER BY +ORDER BY number ASC, number ASC SELECT number @@ -79,7 +79,7 @@ FROM numbers(3) ORDER BY exp(number) DESC SELECT roundToExp2(number) AS x FROM numbers(3) -ORDER BY +ORDER BY number DESC, number DESC 0 @@ -138,12 +138,12 @@ FROM numbers(3) ORDER BY exp(number) ASC SELECT roundToExp2(number) AS x FROM numbers(3) -ORDER BY +ORDER BY x ASC, toFloat32(x) ASC SELECT number AS x FROM numbers(3) -ORDER BY +ORDER BY toFloat32(x) AS k ASC, toFloat64(k) ASC SELECT number @@ -163,6 +163,6 @@ FROM numbers(3) ORDER BY exp(number) DESC SELECT roundToExp2(number) AS x FROM numbers(3) -ORDER BY +ORDER BY x DESC, toFloat32(x) DESC diff --git a/tests/queries/0_stateless/01322_any_input_optimize.reference b/tests/queries/0_stateless/01322_any_input_optimize.reference index c02c9fbeae4..f88f2f5937c 100644 --- a/tests/queries/0_stateless/01322_any_input_optimize.reference +++ b/tests/queries/0_stateless/01322_any_input_optimize.reference @@ -8,7 +8,7 @@ WITH any(number) * 3 AS x SELECT x FROM numbers(1, 2) 3 -SELECT +SELECT anyLast(number) * 3 AS x, x FROM numbers(1, 2) @@ -23,7 +23,7 @@ WITH any(number * 3) AS x SELECT x FROM numbers(1, 2) 3 -SELECT +SELECT anyLast(number * 3) AS x, x FROM numbers(1, 2) diff --git a/tests/queries/0_stateless/01323_redundant_functions_in_order_by.reference b/tests/queries/0_stateless/01323_redundant_functions_in_order_by.reference index 8751f269c4a..fd52438e9b0 100644 --- a/tests/queries/0_stateless/01323_redundant_functions_in_order_by.reference +++ b/tests/queries/0_stateless/01323_redundant_functions_in_order_by.reference @@ -34,11 +34,11 @@ FROM ( SELECT number AS x FROM numbers(3) - ORDER BY + ORDER BY exp(x) ASC, x 
ASC ) -SELECT +SELECT key, a, b, @@ -49,17 +49,17 @@ FROM FROM numbers(4) ) AS s ALL FULL OUTER JOIN test AS t USING (key) -ORDER BY +ORDER BY key ASC, t.key ASC -SELECT +SELECT key, a FROM test -ORDER BY +ORDER BY key ASC, a ASC -SELECT +SELECT key, a FROM test @@ -86,7 +86,7 @@ FROM ( SELECT number AS x FROM numbers(3) - ORDER BY + ORDER BY x ASC, exp(x) ASC ) @@ -95,7 +95,7 @@ FROM ( SELECT number AS x FROM numbers(3) - ORDER BY + ORDER BY x ASC, exp(exp(x)) ASC ) @@ -104,11 +104,11 @@ FROM ( SELECT number AS x FROM numbers(3) - ORDER BY + ORDER BY exp(x) ASC, x ASC ) -SELECT +SELECT key, a, b, @@ -119,21 +119,21 @@ FROM FROM numbers(4) ) AS s ALL FULL OUTER JOIN test AS t USING (key) -ORDER BY +ORDER BY key ASC, t.key ASC -SELECT +SELECT key, a FROM test -ORDER BY +ORDER BY key ASC, a ASC, exp(key + a) ASC -SELECT +SELECT key, a FROM test -ORDER BY +ORDER BY key ASC, exp(key + a) ASC diff --git a/tests/queries/0_stateless/01355_defaultValueOfArgumentType_bug.sql b/tests/queries/0_stateless/01355_defaultValueOfArgumentType_bug.sql index e3168eb09a0..2313cb686a4 100644 --- a/tests/queries/0_stateless/01355_defaultValueOfArgumentType_bug.sql +++ b/tests/queries/0_stateless/01355_defaultValueOfArgumentType_bug.sql @@ -1,4 +1,4 @@ -SELECT +SELECT materialize(toLowCardinality('')) AS lc, toTypeName(lc) WHERE lc = defaultValueOfArgumentType(lc) diff --git a/tests/queries/0_stateless/01372_wrong_order_by_removal.reference b/tests/queries/0_stateless/01372_wrong_order_by_removal.reference index 8ed303c04aa..f1f1bcef6e5 100644 --- a/tests/queries/0_stateless/01372_wrong_order_by_removal.reference +++ b/tests/queries/0_stateless/01372_wrong_order_by_removal.reference @@ -1,14 +1,14 @@ -SELECT +SELECT k, groupArrayMovingSum(v) FROM ( - SELECT + SELECT k, dt, v FROM moving_sum_num - ORDER BY + ORDER BY k ASC, dt ASC ) diff --git a/tests/queries/0_stateless/01379_with_fill_several_columns.sql b/tests/queries/0_stateless/01379_with_fill_several_columns.sql index 5d1cb4e6828..f98431b61b9 100644 --- a/tests/queries/0_stateless/01379_with_fill_several_columns.sql +++ b/tests/queries/0_stateless/01379_with_fill_several_columns.sql @@ -1,21 +1,21 @@ -SELECT +SELECT toDate((number * 10) * 86400) AS d1, toDate(number * 86400) AS d2, 'original' AS source FROM numbers(10) WHERE (number % 3) = 1 -ORDER BY +ORDER BY d2 WITH FILL, d1 WITH FILL STEP 5; SELECT '==============='; -SELECT +SELECT toDate((number * 10) * 86400) AS d1, toDate(number * 86400) AS d2, 'original' AS source FROM numbers(10) WHERE (number % 3) = 1 -ORDER BY +ORDER BY d1 WITH FILL STEP 5, d2 WITH FILL; \ No newline at end of file diff --git a/tests/queries/0_stateless/01390_remove_injective_in_uniq.reference b/tests/queries/0_stateless/01390_remove_injective_in_uniq.reference index 8fe2933b95e..94e1dbc5da7 100644 --- a/tests/queries/0_stateless/01390_remove_injective_in_uniq.reference +++ b/tests/queries/0_stateless/01390_remove_injective_in_uniq.reference @@ -1,4 +1,4 @@ -SELECT +SELECT uniq(x), uniqExact(x), uniqHLL12(x), @@ -9,7 +9,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(x + y), uniqExact(x + y), uniqHLL12(x + y), @@ -17,12 +17,12 @@ SELECT uniqCombined64(x + y) FROM ( - SELECT + SELECT number % 2 AS x, number % 3 AS y FROM numbers(10) ) -SELECT +SELECT uniq(x), uniqExact(x), uniqHLL12(x), @@ -33,7 +33,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(x), uniqExact(x), uniqHLL12(x), @@ -44,7 +44,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(x), uniqExact(x), 
uniqHLL12(x), @@ -55,7 +55,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(x), uniqExact(x), uniqHLL12(x), @@ -74,7 +74,7 @@ FROM ) SELECT uniq(concatAssumeInjective(\'x\', \'y\')) FROM numbers(10) -SELECT +SELECT uniq(x), uniqExact(x), uniqHLL12(x), @@ -85,7 +85,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(x + y), uniqExact(x + y), uniqHLL12(x + y), @@ -93,12 +93,12 @@ SELECT uniqCombined64(x + y) FROM ( - SELECT + SELECT number % 2 AS x, number % 3 AS y FROM numbers(10) ) -SELECT +SELECT uniq(-x), uniqExact(-x), uniqHLL12(-x), @@ -109,7 +109,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(bitNot(x)), uniqExact(bitNot(x)), uniqHLL12(bitNot(x)), @@ -120,7 +120,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(bitNot(-x)), uniqExact(bitNot(-x)), uniqHLL12(bitNot(-x)), @@ -131,7 +131,7 @@ FROM SELECT number % 2 AS x FROM numbers(10) ) -SELECT +SELECT uniq(-bitNot(-x)), uniqExact(-bitNot(-x)), uniqHLL12(-bitNot(-x)), diff --git a/tests/queries/0_stateless/01414_push_predicate_when_contains_with_clause.reference b/tests/queries/0_stateless/01414_push_predicate_when_contains_with_clause.reference index a2ee0336191..13c8fe551c7 100644 --- a/tests/queries/0_stateless/01414_push_predicate_when_contains_with_clause.reference +++ b/tests/queries/0_stateless/01414_push_predicate_when_contains_with_clause.reference @@ -1,12 +1,12 @@ 999 1998 999 1998 -SELECT +SELECT number, square_number FROM ( WITH number * 2 AS square_number - SELECT + SELECT number, square_number FROM numbers_indexed diff --git a/tests/queries/0_stateless/01418_index_analysis_bug.sql b/tests/queries/0_stateless/01418_index_analysis_bug.sql index c5033ac7d96..aae76b63b7d 100644 --- a/tests/queries/0_stateless/01418_index_analysis_bug.sql +++ b/tests/queries/0_stateless/01418_index_analysis_bug.sql @@ -9,13 +9,13 @@ ENGINE = MergeTree() PARTITION BY toYYYYMM(eventday) ORDER BY (eventday, user_id); -INSERT INTO mytable_local SELECT +INSERT INTO mytable_local SELECT toDateTime('2020-06-01 00:00:00') + toIntervalMinute(number) AS created, toDate(created) AS eventday, if((number % 100) > 50, 742522, number % 32141) AS user_id FROM numbers(100000); -SELECT +SELECT eventday, count(*) FROM mytable_local diff --git a/tests/queries/0_stateless/01455_duplicate_distinct_optimization.reference b/tests/queries/0_stateless/01455_duplicate_distinct_optimization.reference index c5a06ca0cd3..2c54899f9f5 100644 --- a/tests/queries/0_stateless/01455_duplicate_distinct_optimization.reference +++ b/tests/queries/0_stateless/01455_duplicate_distinct_optimization.reference @@ -9,7 +9,7 @@ FROM SELECT DISTINCT number * 2 FROM ( - SELECT DISTINCT + SELECT DISTINCT number * 2, number FROM numbers(1) @@ -20,12 +20,12 @@ FROM SELECT DISTINCT number * 2 AS number FROM numbers(1) ) -SELECT +SELECT b, a FROM ( - SELECT DISTINCT + SELECT DISTINCT number % 2 AS a, number % 3 AS b FROM numbers(100) @@ -33,7 +33,7 @@ FROM SELECT DISTINCT a FROM ( - SELECT DISTINCT + SELECT DISTINCT number % 2 AS a, number % 3 AS b FROM numbers(100) @@ -44,7 +44,7 @@ FROM SELECT DISTINCT a FROM ( - SELECT DISTINCT + SELECT DISTINCT number % 2 AS a, number % 3 AS b FROM numbers(100) @@ -53,45 +53,45 @@ FROM SELECT DISTINCT a FROM ( - SELECT + SELECT a, b FROM ( - SELECT DISTINCT + SELECT DISTINCT number % 2 AS a, number % 3 AS b FROM numbers(100) ) ) -SELECT +SELECT a, b FROM ( - SELECT + SELECT b, a FROM ( - SELECT DISTINCT + SELECT DISTINCT number AS a, number AS b FROM numbers(1) ) ) 
-SELECT +SELECT a, b FROM ( - SELECT + SELECT b, a, a + b FROM ( - SELECT DISTINCT + SELECT DISTINCT number % 2 AS a, number % 3 AS b FROM numbers(100) @@ -103,7 +103,7 @@ FROM SELECT a FROM ( - SELECT DISTINCT + SELECT DISTINCT number % 2 AS a, number % 3 AS b FROM numbers(100) diff --git a/tests/queries/0_stateless/01470_columns_transformers.reference b/tests/queries/0_stateless/01470_columns_transformers.reference index 595d99b917f..c0f02e51ccf 100644 --- a/tests/queries/0_stateless/01470_columns_transformers.reference +++ b/tests/queries/0_stateless/01470_columns_transformers.reference @@ -9,54 +9,54 @@ 222 18 347 111 11 173.5 1970-04-11 1970-01-11 1970-11-21 -SELECT +SELECT sum(i), sum(j), sum(k) FROM columns_transformers -SELECT +SELECT avg(i), avg(j), avg(k) FROM columns_transformers -SELECT +SELECT toDate(any(i)), toDate(any(j)), toDate(any(k)) FROM columns_transformers AS a -SELECT +SELECT length(toString(j)), length(toString(k)) FROM columns_transformers -SELECT +SELECT sum(j), sum(k) FROM columns_transformers -SELECT +SELECT avg(i), avg(k) FROM columns_transformers -SELECT +SELECT toDate(any(i)), toDate(any(j)), toDate(any(k)) FROM columns_transformers AS a -SELECT +SELECT sum(i + 1 AS i), sum(j), sum(k) FROM columns_transformers -SELECT +SELECT avg(i + 1 AS i), avg(j + 2 AS j), avg(k) FROM columns_transformers -SELECT +SELECT toDate(any(i)), toDate(any(j)), toDate(any(k)) FROM columns_transformers AS a -SELECT +SELECT (i + 1) + 1 AS i, j, k diff --git a/tests/queries/1_stateful/00063_loyalty_joins.sql b/tests/queries/1_stateful/00063_loyalty_joins.sql index b2491346673..7713c65838c 100644 --- a/tests/queries/1_stateful/00063_loyalty_joins.sql +++ b/tests/queries/1_stateful/00063_loyalty_joins.sql @@ -1,12 +1,12 @@ SET any_join_distinct_right_table_keys = 1; SET joined_subquery_requires_alias = 0; -SELECT +SELECT loyalty, count() FROM test.hits ANY LEFT JOIN ( - SELECT + SELECT UserID, sum(SearchEngineID = 2) AS yandex, sum(SearchEngineID = 3) AS google, @@ -20,7 +20,7 @@ GROUP BY loyalty ORDER BY loyalty ASC; -SELECT +SELECT loyalty, count() FROM @@ -29,7 +29,7 @@ FROM FROM test.hits ) ANY LEFT JOIN ( - SELECT + SELECT UserID, sum(SearchEngineID = 2) AS yandex, sum(SearchEngineID = 3) AS google, @@ -43,12 +43,12 @@ GROUP BY loyalty ORDER BY loyalty ASC; -SELECT +SELECT loyalty, count() FROM ( - SELECT + SELECT loyalty, UserID FROM @@ -57,7 +57,7 @@ FROM FROM test.hits ) ANY LEFT JOIN ( - SELECT + SELECT UserID, sum(SearchEngineID = 2) AS yandex, sum(SearchEngineID = 3) AS google, @@ -72,18 +72,18 @@ GROUP BY loyalty ORDER BY loyalty ASC; -SELECT +SELECT loyalty, count() AS c, bar(log(c + 1) * 1000, 0, log(3000000) * 1000, 80) FROM test.hits ANY INNER JOIN ( - SELECT + SELECT UserID, toInt8(if(yandex > google, yandex / (yandex + google), -google / (yandex + google)) * 10) AS loyalty FROM ( - SELECT + SELECT UserID, sum(SearchEngineID = 2) AS yandex, sum(SearchEngineID = 3) AS google From 11ba7049c0ad5be7aee7d6e96a73b375c8ab3b99 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Tue, 8 Sep 2020 23:33:08 +0300 Subject: [PATCH 061/341] Cover WITH format --- tests/queries/0_stateless/01471_with_format.reference | 6 ++++++ tests/queries/0_stateless/01471_with_format.sql | 2 ++ 2 files changed, 8 insertions(+) create mode 100644 tests/queries/0_stateless/01471_with_format.reference create mode 100644 tests/queries/0_stateless/01471_with_format.sql diff --git a/tests/queries/0_stateless/01471_with_format.reference b/tests/queries/0_stateless/01471_with_format.reference new file mode 
100644 index 00000000000..806ec312bb4 --- /dev/null +++ b/tests/queries/0_stateless/01471_with_format.reference @@ -0,0 +1,6 @@ +WITH 1 +SELECT 1 +WITH + 1, + 2 +SELECT 1 diff --git a/tests/queries/0_stateless/01471_with_format.sql b/tests/queries/0_stateless/01471_with_format.sql new file mode 100644 index 00000000000..60f6fe4135a --- /dev/null +++ b/tests/queries/0_stateless/01471_with_format.sql @@ -0,0 +1,2 @@ +EXPLAIN SYNTAX WITH 1 SELECT 1; +EXPLAIN SYNTAX WITH 1, 2 SELECT 1; From 68c441e07b0072d7ffcd71491dcee219b2d90b62 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Tue, 8 Sep 2020 23:54:46 +0300 Subject: [PATCH 062/341] Add LIMIT BY format test --- .../0_stateless/01471_limit_by_format.reference | 10 ++++++++++ tests/queries/0_stateless/01471_limit_by_format.sql | 2 ++ 2 files changed, 12 insertions(+) create mode 100644 tests/queries/0_stateless/01471_limit_by_format.reference create mode 100644 tests/queries/0_stateless/01471_limit_by_format.sql diff --git a/tests/queries/0_stateless/01471_limit_by_format.reference b/tests/queries/0_stateless/01471_limit_by_format.reference new file mode 100644 index 00000000000..aeab30435c0 --- /dev/null +++ b/tests/queries/0_stateless/01471_limit_by_format.reference @@ -0,0 +1,10 @@ +SELECT dummy +FROM system.one +LIMIT 1 BY dummy +LIMIT 1 +SELECT dummy +FROM system.one +LIMIT 1 BY + 0 + dummy, + 0 - dummy +LIMIT 1 diff --git a/tests/queries/0_stateless/01471_limit_by_format.sql b/tests/queries/0_stateless/01471_limit_by_format.sql new file mode 100644 index 00000000000..a58099a223a --- /dev/null +++ b/tests/queries/0_stateless/01471_limit_by_format.sql @@ -0,0 +1,2 @@ +EXPLAIN SYNTAX SELECT * FROM system.one LIMIT 1 BY * LIMIT 1; +EXPLAIN SYNTAX SELECT * FROM system.one LIMIT 1 BY 0+dummy, 0-dummy LIMIT 1; From bee629c971d8f5add8fe4f205aa30f8f4e66375f Mon Sep 17 00:00:00 2001 From: Vitaly Baranov Date: Tue, 8 Sep 2020 02:08:42 +0300 Subject: [PATCH 063/341] Use join() instead of detach() for the lists_writing_thread in DiskAccessStorage. --- src/Access/DiskAccessStorage.cpp | 47 ++++++++++++++------------------ src/Access/DiskAccessStorage.h | 5 ++-- 2 files changed, 22 insertions(+), 30 deletions(-) diff --git a/src/Access/DiskAccessStorage.cpp b/src/Access/DiskAccessStorage.cpp index fc80859885d..6162e4aacc2 100644 --- a/src/Access/DiskAccessStorage.cpp +++ b/src/Access/DiskAccessStorage.cpp @@ -426,33 +426,41 @@ bool DiskAccessStorage::writeLists() void DiskAccessStorage::scheduleWriteLists(EntityType type) { if (failed_to_write_lists) - return; + return; /// We don't try to write list files after the first fail. + /// The next restart of the server will invoke rebuilding of the list files. - bool already_scheduled = !types_of_lists_to_write.empty(); types_of_lists_to_write.insert(type); - if (already_scheduled) - return; + if (lists_writing_thread_is_waiting) + return; /// If the lists' writing thread is still waiting we can update `types_of_lists_to_write` easily, + /// without restarting that thread. + + if (lists_writing_thread.joinable()) + lists_writing_thread.join(); /// Create the 'need_rebuild_lists.mark' file. /// This file will be used later to find out if writing lists is successful or not. 
std::ofstream{getNeedRebuildListsMarkFilePath(directory_path)}; - startListsWritingThread(); + lists_writing_thread = ThreadFromGlobalPool{&DiskAccessStorage::listsWritingThreadFunc, this}; + lists_writing_thread_is_waiting = true; } -void DiskAccessStorage::startListsWritingThread() +void DiskAccessStorage::listsWritingThreadFunc() { - if (lists_writing_thread.joinable()) + std::unique_lock lock{mutex}; + { - if (!lists_writing_thread_exited) - return; - lists_writing_thread.detach(); + /// It's better not to write the lists files too often, that's why we need + /// the following timeout. + const auto timeout = std::chrono::minutes(1); + SCOPE_EXIT({ lists_writing_thread_is_waiting = false; }); + if (lists_writing_thread_should_exit.wait_for(lock, timeout) != std::cv_status::timeout) + return; /// The destructor requires us to exit. } - lists_writing_thread_exited = false; - lists_writing_thread = ThreadFromGlobalPool{&DiskAccessStorage::listsWritingThreadFunc, this}; + writeLists(); } @@ -466,21 +474,6 @@ void DiskAccessStorage::stopListsWritingThread() } -void DiskAccessStorage::listsWritingThreadFunc() -{ - std::unique_lock lock{mutex}; - SCOPE_EXIT({ lists_writing_thread_exited = true; }); - - /// It's better not to write the lists files too often, that's why we need - /// the following timeout. - const auto timeout = std::chrono::minutes(1); - if (lists_writing_thread_should_exit.wait_for(lock, timeout) != std::cv_status::timeout) - return; /// The destructor requires us to exit. - - writeLists(); -} - - /// Reads and parses all the ".sql" files from a specified directory /// and then saves the files "users.list", "roles.list", etc. to the same directory. bool DiskAccessStorage::rebuildLists() diff --git a/src/Access/DiskAccessStorage.h b/src/Access/DiskAccessStorage.h index 11eb1c3b1ad..ed2dc8b1242 100644 --- a/src/Access/DiskAccessStorage.h +++ b/src/Access/DiskAccessStorage.h @@ -42,9 +42,8 @@ private: void scheduleWriteLists(EntityType type); bool rebuildLists(); - void startListsWritingThread(); - void stopListsWritingThread(); void listsWritingThreadFunc(); + void stopListsWritingThread(); void insertNoLock(const UUID & id, const AccessEntityPtr & new_entity, bool replace_if_exists, Notifications & notifications); void removeNoLock(const UUID & id, Notifications & notifications); @@ -74,7 +73,7 @@ private: bool failed_to_write_lists = false; /// Whether writing of the list files has been failed since the recent restart of the server. ThreadFromGlobalPool lists_writing_thread; /// List files are written in a separate thread. std::condition_variable lists_writing_thread_should_exit; /// Signals `lists_writing_thread` to exit. - std::atomic lists_writing_thread_exited = false; + bool lists_writing_thread_is_waiting = false; mutable std::list handlers_by_type[static_cast(EntityType::MAX)]; mutable std::mutex mutex; }; From cce970e40cdf1eba81a1d34c6e692ec883d544e2 Mon Sep 17 00:00:00 2001 From: Vitaly Baranov Date: Tue, 8 Sep 2020 02:09:03 +0300 Subject: [PATCH 064/341] Use join() instead of detach() for loading threads in ExternalLoader. 
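The general rationale: a detached thread has no owner, so during shutdown it can keep running and touch members of an object that is already being destroyed; keeping the thread handle and joining it bounds the worker's lifetime by its owner's lifetime. A minimal sketch of that ownership pattern, with hypothetical names and not taken from this patch:

    #include <thread>
    #include <vector>

    struct AsyncLoader
    {
        std::vector<std::thread> workers;   // handles are kept instead of detached

        void schedule()
        {
            workers.emplace_back([] { /* perform one load */ });
        }

        ~AsyncLoader()
        {
            // Joining guarantees no worker outlives the data it captured.
            for (auto & worker : workers)
                if (worker.joinable())
                    worker.join();
        }
    };
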
--- src/Interpreters/ExternalLoader.cpp | 29 +++++++++++++++++++++++------ 1 file changed, 23 insertions(+), 6 deletions(-) diff --git a/src/Interpreters/ExternalLoader.cpp b/src/Interpreters/ExternalLoader.cpp index e8df205760a..dcef36de175 100644 --- a/src/Interpreters/ExternalLoader.cpp +++ b/src/Interpreters/ExternalLoader.cpp @@ -893,6 +893,8 @@ private: cancelLoading(info); } + putBackFinishedThreadsToPool(); + /// All loadings have unique loading IDs. size_t loading_id = next_id_counter++; info.loading_id = loading_id; @@ -914,6 +916,21 @@ private: } } + void putBackFinishedThreadsToPool() + { + for (auto loading_id : recently_finished_loadings) + { + auto it = loading_threads.find(loading_id); + if (it != loading_threads.end()) + { + auto thread = std::move(it->second); + loading_threads.erase(it); + thread.join(); /// It's very likely that `thread` has already finished. + } + } + recently_finished_loadings.clear(); + } + static void cancelLoading(Info & info) { if (!info.isLoading()) @@ -1095,12 +1112,11 @@ private: } min_id_to_finish_loading_dependencies.erase(std::this_thread::get_id()); - auto it = loading_threads.find(loading_id); - if (it != loading_threads.end()) - { - it->second.detach(); - loading_threads.erase(it); - } + /// Add `loading_id` to the list of recently finished loadings. + /// This list is used to later put the threads which finished loading back to the thread pool. + /// (We can't put the loading thread back to the thread pool immediately here because at this point + /// the loading thread is about to finish but it's not finished yet right now.) + recently_finished_loadings.push_back(loading_id); } /// Calculate next update time for loaded_object. Can be called without mutex locking, @@ -1158,6 +1174,7 @@ private: bool always_load_everything = false; std::atomic enable_async_loading = false; std::unordered_map loading_threads; + std::vector recently_finished_loadings; std::unordered_map min_id_to_finish_loading_dependencies; size_t next_id_counter = 1; /// should always be > 0 mutable pcg64 rnd_engine{randomSeed()}; From 0c2ecb53d13f49437ec47d336fbf68ae9e20c2f7 Mon Sep 17 00:00:00 2001 From: alexey-milovidov Date: Wed, 9 Sep 2020 09:35:05 +0300 Subject: [PATCH 065/341] Update arrayIndex.h --- src/Functions/array/arrayIndex.h | 4 ---- 1 file changed, 4 deletions(-) diff --git a/src/Functions/array/arrayIndex.h b/src/Functions/array/arrayIndex.h index f96eb09c861..d4695ec0af5 100644 --- a/src/Functions/array/arrayIndex.h +++ b/src/Functions/array/arrayIndex.h @@ -739,10 +739,6 @@ private: if (!col_lc) return false; -// assert(checkAndGetColumn(col_lc->getDictionaryPtr().get())); -// assert(col_lc->isNullable()); -// assert(isColumnNullable(*col_lc->getDictionaryPtr().get())); - const auto [null_map_data, null_map_item] = getNullMaps(block, arguments); const IColumn& col_arg = *block.getByPosition(arguments[1]).column.get(); From 48bf65d63de2cacab0742f79fcfbab499dae384e Mon Sep 17 00:00:00 2001 From: bharatnc Date: Tue, 8 Sep 2020 23:45:04 -0700 Subject: [PATCH 066/341] StorageReplicatedMergeTree - improve integration test --- .../configs/remote_servers.xml | 14 -------------- .../test_replicated_zk_conn_failure/test.py | 13 +++++++++---- 2 files changed, 9 insertions(+), 18 deletions(-) delete mode 100644 tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml diff --git a/tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml b/tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml deleted file 
mode 100644 index 538aa72d386..00000000000 --- a/tests/integration/test_replicated_zk_conn_failure/configs/remote_servers.xml +++ /dev/null @@ -1,14 +0,0 @@ - - - - - true - - shard_0 - node1 - 9000 - - - - - diff --git a/tests/integration/test_replicated_zk_conn_failure/test.py b/tests/integration/test_replicated_zk_conn_failure/test.py index 3f106bd2981..a860716ee82 100644 --- a/tests/integration/test_replicated_zk_conn_failure/test.py +++ b/tests/integration/test_replicated_zk_conn_failure/test.py @@ -12,11 +12,11 @@ from helpers.network import PartitionManager # 3. Try creating the table and there would be a Poco:Exception. # 4. Try creating the table again and there should not be any error # that indicates that the Directory for table already exists. - - +# 5. Final step is to restore ZooKeeper connection and verify that +# the table creation and queries work. def test_replicated_zk_conn_failure(): cluster = ClickHouseCluster(__file__) - node1 = cluster.add_instance('node1', main_configs=["configs/remote_servers.xml"], with_zookeeper=True) + node1 = cluster.add_instance('node1', with_zookeeper=True) try: cluster.start() node1.query("CREATE DATABASE replica;") @@ -27,7 +27,7 @@ def test_replicated_zk_conn_failure(): ) Engine=ReplicatedMergeTree('/clickhouse/tables/replica/test', 'node1') PARTITION BY toYYYYMMDD(event_time) - ORDER BY id;'''.format(replica=node1.name) + ORDER BY id;''' with PartitionManager() as pm: pm.drop_instance_zk_connections(node1) time.sleep(5) @@ -41,5 +41,10 @@ def test_replicated_zk_conn_failure(): # Should not expect any errors related to directory already existing # and those should have been already cleaned up during the previous retry. assert "Directory for table data data/replica/test/ already exists" not in error + # restore ZooKeeper connections. + pm.restore_instance_zk_connections(node1) + # retry create query and query the table created. 
+ node1.query(query_create) + assert "0\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') finally: cluster.shutdown() From c34eaf5de3380e8b12f0f6e8b578bb13744660bf Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 10:08:38 +0300 Subject: [PATCH 067/341] Update ci_config and llvm --- contrib/llvm | 2 +- tests/ci/ci_config.json | 26 +++++++++++++------------- 2 files changed, 14 insertions(+), 14 deletions(-) diff --git a/contrib/llvm b/contrib/llvm index 3d6c7e91676..8f24d507c1c 160000 --- a/contrib/llvm +++ b/contrib/llvm @@ -1 +1 @@ -Subproject commit 3d6c7e916760b395908f28a1c885c8334d4fa98b +Subproject commit 8f24d507c1cfeec66d27f48fe74518fd278e2d25 diff --git a/tests/ci/ci_config.json b/tests/ci/ci_config.json index 44e9df49216..adb736a8df3 100644 --- a/tests/ci/ci_config.json +++ b/tests/ci/ci_config.json @@ -1,7 +1,7 @@ { "build_config": [ { - "compiler": "gcc-9", + "compiler": "gcc-10", "build-type": "", "sanitizer": "", "package-type": "deb", @@ -12,7 +12,7 @@ "with_coverage": false }, { - "compiler": "gcc-9", + "compiler": "gcc-10", "build-type": "", "sanitizer": "", "package-type": "performance", @@ -22,7 +22,7 @@ "with_coverage": false }, { - "compiler": "gcc-9", + "compiler": "gcc-10", "build-type": "", "sanitizer": "", "package-type": "binary", @@ -92,7 +92,7 @@ "with_coverage": false }, { - "compiler": "gcc-9", + "compiler": "gcc-10", "build-type": "", "sanitizer": "", "package-type": "deb", @@ -227,7 +227,7 @@ }, "Functional stateful tests (release)": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -239,7 +239,7 @@ }, "Functional stateful tests (release, DatabaseAtomic)": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -311,7 +311,7 @@ }, "Functional stateless tests (release)": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -323,7 +323,7 @@ }, "Functional stateless tests (unbundled)": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -335,7 +335,7 @@ }, "Functional stateless tests (release, polymorphic parts enabled)": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -347,7 +347,7 @@ }, "Functional stateless tests (release, DatabaseAtomic)": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -443,7 +443,7 @@ }, "Compatibility check": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -467,7 +467,7 @@ }, "Testflows check": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "deb", "build_type": "relwithdebuginfo", "sanitizer": "none", @@ -479,7 +479,7 @@ }, "Unit tests release gcc": { "required_build_properties": { - "compiler": "gcc-9", + "compiler": "gcc-10", "package_type": "binary", "build_type": "relwithdebuginfo", "sanitizer": "none", From b40998ca007afbe702768ede9bf5776274347040 Mon Sep 17 00:00:00 2001 From: Amos Bird Date: 
Wed, 9 Sep 2020 15:41:38 +0800 Subject: [PATCH 068/341] Treat query as function argument. --- src/Interpreters/QueryNormalizer.cpp | 2 +- src/Parsers/ASTFunction.cpp | 13 +++++++++++-- src/Parsers/ASTFunction.h | 4 +++- src/Parsers/ExpressionElementParsers.cpp | 6 ++++-- src/TableFunctions/TableFunctionView.cpp | 19 ++++++++----------- 5 files changed, 27 insertions(+), 17 deletions(-) diff --git a/src/Interpreters/QueryNormalizer.cpp b/src/Interpreters/QueryNormalizer.cpp index 59233218a50..07d4888b555 100644 --- a/src/Interpreters/QueryNormalizer.cpp +++ b/src/Interpreters/QueryNormalizer.cpp @@ -152,7 +152,7 @@ void QueryNormalizer::visitChildren(const ASTPtr & node, Data & data) { if (const auto * func_node = node->as()) { - if (func_node->query) + if (func_node->tryGetQueryArgument()) { if (func_node->name != "view") throw Exception("Query argument can only be used in the `view` TableFunction", ErrorCodes::BAD_ARGUMENTS); diff --git a/src/Parsers/ASTFunction.cpp b/src/Parsers/ASTFunction.cpp index 07429c8104f..bbd910ae875 100644 --- a/src/Parsers/ASTFunction.cpp +++ b/src/Parsers/ASTFunction.cpp @@ -48,7 +48,6 @@ ASTPtr ASTFunction::clone() const auto res = std::make_shared(*this); res->children.clear(); - if (query) { res->query = query->clone(); res->children.push_back(res->query); } if (arguments) { res->arguments = arguments->clone(); res->children.push_back(res->arguments); } if (parameters) { res->parameters = parameters->clone(); res->children.push_back(res->parameters); } @@ -112,6 +111,16 @@ static bool highlightStringLiteralWithMetacharacters(const ASTPtr & node, const } +ASTSelectWithUnionQuery * ASTFunction::tryGetQueryArgument() const +{ + if (arguments && arguments->children.size() == 1) + { + return arguments->children[0]->as(); + } + return nullptr; +} + + void ASTFunction::formatImplWithoutAlias(const FormatSettings & settings, FormatState & state, FormatStateStacked frame) const { FormatStateStacked nested_need_parens = frame; @@ -119,7 +128,7 @@ void ASTFunction::formatImplWithoutAlias(const FormatSettings & settings, Format nested_need_parens.need_parens = true; nested_dont_need_parens.need_parens = false; - if (query) + if (auto * query = tryGetQueryArgument()) { std::string nl_or_nothing = settings.one_line ? "" : "\n"; std::string indent_str = settings.one_line ? "" : std::string(4u * frame.indent, ' '); diff --git a/src/Parsers/ASTFunction.h b/src/Parsers/ASTFunction.h index b94614426d8..3b87ab68282 100644 --- a/src/Parsers/ASTFunction.h +++ b/src/Parsers/ASTFunction.h @@ -2,6 +2,7 @@ #include #include +#include namespace DB @@ -13,7 +14,6 @@ class ASTFunction : public ASTWithAlias { public: String name; - ASTPtr query; // It's possible for a function to accept a query as its only argument. ASTPtr arguments; /// parameters - for parametric aggregate function. Example: quantile(0.9)(x) - what in first parens are 'parameters'. 
ASTPtr parameters; @@ -26,6 +26,8 @@ public: void updateTreeHashImpl(SipHash & hash_state) const override; + ASTSelectWithUnionQuery * tryGetQueryArgument() const; + protected: void formatImplWithoutAlias(const FormatSettings & settings, FormatState & state, FormatStateStacked frame) const override; void appendColumnNameImpl(WriteBuffer & ostr) const override; diff --git a/src/Parsers/ExpressionElementParsers.cpp b/src/Parsers/ExpressionElementParsers.cpp index 985507071be..64e3a0363d1 100644 --- a/src/Parsers/ExpressionElementParsers.cpp +++ b/src/Parsers/ExpressionElementParsers.cpp @@ -260,8 +260,10 @@ bool ParserFunction::parseImpl(Pos & pos, ASTPtr & node, Expected & expected) ++pos; auto function_node = std::make_shared(); tryGetIdentifierNameInto(identifier, function_node->name); - function_node->query = query; - function_node->children.push_back(function_node->query); + auto expr_list_with_single_query = std::make_shared(); + expr_list_with_single_query->children.push_back(query); + function_node->arguments = expr_list_with_single_query; + function_node->children.push_back(function_node->arguments); node = function_node; return true; } diff --git a/src/TableFunctions/TableFunctionView.cpp b/src/TableFunctions/TableFunctionView.cpp index 6166fa56f47..8d3f7b06fa3 100644 --- a/src/TableFunctions/TableFunctionView.cpp +++ b/src/TableFunctions/TableFunctionView.cpp @@ -20,18 +20,15 @@ StoragePtr TableFunctionView::executeImpl(const ASTPtr & ast_function, const Con { if (const auto * function = ast_function->as()) { - if (function->query) + if (auto * select = function->tryGetQueryArgument()) { - if (auto * select = function->query->as()) - { - auto sample = InterpreterSelectWithUnionQuery::getSampleBlock(function->query, context); - auto columns = ColumnsDescription(sample.getNamesAndTypesList()); - ASTCreateQuery create; - create.select = select; - auto res = StorageView::create(StorageID(getDatabaseName(), table_name), create, columns); - res->startup(); - return res; - } + auto sample = InterpreterSelectWithUnionQuery::getSampleBlock(function->arguments->children[0] /* ASTPtr */, context); + auto columns = ColumnsDescription(sample.getNamesAndTypesList()); + ASTCreateQuery create; + create.select = select; + auto res = StorageView::create(StorageID(getDatabaseName(), table_name), create, columns); + res->startup(); + return res; } } throw Exception("Table function '" + getName() + "' requires a query argument.", ErrorCodes::BAD_ARGUMENTS); From d8fce448a29eecff6e1dc77299f63c3e75f0fbbc Mon Sep 17 00:00:00 2001 From: hcz Date: Wed, 9 Sep 2020 14:20:14 +0800 Subject: [PATCH 069/341] Implement null_as_default for JSONStrings formats --- src/DataTypes/DataTypeNullable.cpp | 12 ++++++++++-- src/DataTypes/DataTypeNullable.h | 2 ++ .../Impl/JSONCompactEachRowRowInputFormat.cpp | 7 ++++--- .../Formats/Impl/JSONEachRowRowInputFormat.cpp | 7 ++++--- .../01016_input_null_as_default.reference | 5 +++++ .../0_stateless/01016_input_null_as_default.sh | 8 ++++++++ 6 files changed, 33 insertions(+), 8 deletions(-) diff --git a/src/DataTypes/DataTypeNullable.cpp b/src/DataTypes/DataTypeNullable.cpp index 3318196b951..6e452b2759b 100644 --- a/src/DataTypes/DataTypeNullable.cpp +++ b/src/DataTypes/DataTypeNullable.cpp @@ -318,13 +318,20 @@ ReturnType DataTypeNullable::deserializeTextQuoted(IColumn & column, ReadBuffer void DataTypeNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { - safeDeserialize(column, *nested_data_type, + 
deserializeWholeText(column, istr, settings, nested_data_type); +} + +template +ReturnType DataTypeNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, + const DataTypePtr & nested_data_type) +{ + return safeDeserialize(column, *nested_data_type, [&istr] { return checkStringByFirstCharacterAndAssertTheRestCaseInsensitive("NULL", istr) || checkStringByFirstCharacterAndAssertTheRest("ᴺᵁᴸᴸ", istr); }, - [this, &istr, &settings] (IColumn & nested) { nested_data_type->deserializeAsWholeText(nested, istr, settings); }); + [&nested_data_type, &istr, &settings] (IColumn & nested) { nested_data_type->deserializeAsWholeText(nested, istr, settings); }); } @@ -551,6 +558,7 @@ DataTypePtr removeNullable(const DataTypePtr & type) } +template bool DataTypeNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const DataTypePtr & nested); template bool DataTypeNullable::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const DataTypePtr & nested); template bool DataTypeNullable::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &, const DataTypePtr & nested); template bool DataTypeNullable::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const DataTypePtr & nested); diff --git a/src/DataTypes/DataTypeNullable.h b/src/DataTypes/DataTypeNullable.h index 22d403da6c4..587eecdf32e 100644 --- a/src/DataTypes/DataTypeNullable.h +++ b/src/DataTypes/DataTypeNullable.h @@ -103,6 +103,8 @@ public: /// If ReturnType is bool, check for NULL and deserialize value into non-nullable column (and return true) or insert default value of nested type (and return false) /// If ReturnType is void, deserialize Nullable(T) template + static ReturnType deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const DataTypePtr & nested); + template static ReturnType deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const DataTypePtr & nested); template static ReturnType deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &, const DataTypePtr & nested); diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp index eb697ce5318..49c8d29ca2f 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowInputFormat.cpp @@ -205,14 +205,15 @@ void JSONCompactEachRowRowInputFormat::readField(size_t index, MutableColumns & if (yield_strings) { - // notice: null_as_default on "null" strings is not supported - String str; readJSONString(str, in); ReadBufferFromString buf(str); - type->deserializeAsWholeText(*columns[index], buf, format_settings); + if (format_settings.null_as_default && !type->isNullable()) + read_columns[index] = DataTypeNullable::deserializeWholeText(*columns[index], buf, format_settings, type); + else + type->deserializeAsWholeText(*columns[index], buf, format_settings); } else { diff --git a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp index 9ba82fbb009..ab775a3e7aa 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp @@ -146,14 +146,15 @@ void JSONEachRowRowInputFormat::readField(size_t index, 
MutableColumns & columns if (yield_strings) { - // notice: null_as_default on "null" strings is not supported - String str; readJSONString(str, in); ReadBufferFromString buf(str); - type->deserializeAsWholeText(*columns[index], buf, format_settings); + if (format_settings.null_as_default && !type->isNullable()) + read_columns[index] = DataTypeNullable::deserializeWholeText(*columns[index], buf, format_settings, type); + else + type->deserializeAsWholeText(*columns[index], buf, format_settings); } else { diff --git a/tests/queries/0_stateless/01016_input_null_as_default.reference b/tests/queries/0_stateless/01016_input_null_as_default.reference index ba9657bf16e..d7010f42d4e 100644 --- a/tests/queries/0_stateless/01016_input_null_as_default.reference +++ b/tests/queries/0_stateless/01016_input_null_as_default.reference @@ -18,6 +18,11 @@ JSONEachRow 1 world 3 2019-07-23 [1,2,3] ('tuple',3.14) 2 Hello 123 2019-06-19 [] ('test',2.71828) 3 Hello 42 2019-06-19 [1,2,3] ('default',0.75) +JSONStringsEachRow +0 1 42 2019-07-22 [10,20,30] ('default',0) +1 world 3 2019-07-23 [1,2,3] ('tuple',3.14) +2 Hello 123 2019-06-19 [] ('test',2.71828) +3 Hello 42 2019-06-19 [1,2,3] ('default',0.75) Template (Quoted) 0 1 42 2019-07-22 [10,20,30] ('default',0) 1 world 3 2019-07-23 [1,2,3] ('tuple',3.14) diff --git a/tests/queries/0_stateless/01016_input_null_as_default.sh b/tests/queries/0_stateless/01016_input_null_as_default.sh index a40287eaba8..f31e6591e97 100755 --- a/tests/queries/0_stateless/01016_input_null_as_default.sh +++ b/tests/queries/0_stateless/01016_input_null_as_default.sh @@ -38,6 +38,14 @@ echo '{"i": null, "s": "1", "n": null, "d": "2019-07-22", "a": [10, 20, 30], "t" $CLICKHOUSE_CLIENT --query="SELECT * FROM null_as_default ORDER BY i"; $CLICKHOUSE_CLIENT --query="TRUNCATE TABLE null_as_default"; +echo 'JSONStringsEachRow' +echo '{"i": "null", "s": "1", "n": "ᴺᵁᴸᴸ", "d": "2019-07-22", "a": "[10, 20, 30]", "t": "NULL"} +{"i": "1", "s": "world", "n": "3", "d": "2019-07-23", "a": "null", "t": "('\''tuple'\'', 3.14)"} +{"i": "2", "s": "null", "n": "123", "d": "null", "a": "[]", "t": "('\''test'\'', 2.71828)"} +{"i": "3", "s": "null", "n": "null", "d": "null", "a": "null", "t": "null"}' | $CLICKHOUSE_CLIENT --input_format_null_as_default=1 --query="INSERT INTO null_as_default FORMAT JSONStringsEachRow"; +$CLICKHOUSE_CLIENT --query="SELECT * FROM null_as_default ORDER BY i"; +$CLICKHOUSE_CLIENT --query="TRUNCATE TABLE null_as_default"; + echo 'Template (Quoted)' echo 'NULL, '\''1'\'', null, '\''2019-07-22'\'', [10, 20, 30], NuLl 1, '\''world'\'', 3, '\''2019-07-23'\'', NULL, ('\''tuple'\'', 3.14) From 4ba8f8960bd4e86a57dafba6a0aa1574b66d97db Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 12:53:24 +0300 Subject: [PATCH 070/341] Increase frame-larger-than --- cmake/warnings.cmake | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cmake/warnings.cmake b/cmake/warnings.cmake index 2f78dc34079..aec3e46ffa6 100644 --- a/cmake/warnings.cmake +++ b/cmake/warnings.cmake @@ -23,7 +23,7 @@ option (WEVERYTHING "Enables -Weverything option with some exceptions. This is i # Control maximum size of stack frames. It can be important if the code is run in fibers with small stack size. # Only in release build because debug has too large stack frames. 
if ((NOT CMAKE_BUILD_TYPE_UC STREQUAL "DEBUG") AND (NOT SANITIZE)) - add_warning(frame-larger-than=16384) + add_warning(frame-larger-than=32768) endif () if (COMPILER_CLANG) From 2ea59cb0c2fc9ea25cb6029f910952903e1d0bbd Mon Sep 17 00:00:00 2001 From: hcz Date: Wed, 9 Sep 2020 17:54:41 +0800 Subject: [PATCH 071/341] Fix tests --- .../0_stateless/01446_json_strings_each_row.reference | 4 ++-- .../01448_json_compact_strings_each_row.reference | 8 ++++---- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/tests/queries/0_stateless/01446_json_strings_each_row.reference b/tests/queries/0_stateless/01446_json_strings_each_row.reference index 84d41095b77..812026534ea 100644 --- a/tests/queries/0_stateless/01446_json_strings_each_row.reference +++ b/tests/queries/0_stateless/01446_json_strings_each_row.reference @@ -16,7 +16,7 @@ {"v1":"first","v2":"1","v3":"2","v4":"0"} {"v1":"second","v2":"2","v3":"0","v4":"6"} 6 -{"v1":"first","v2":"1","v3":"2","v4":"0"} -{"v1":"second","v2":"2","v3":"0","v4":"6"} +{"v1":"first","v2":"1","v3":"2","v4":"8"} +{"v1":"second","v2":"2","v3":"32","v4":"6"} 7 {"v1":"16","n.id":"[15,16,17]","n.name":"['first','second','third']"} diff --git a/tests/queries/0_stateless/01448_json_compact_strings_each_row.reference b/tests/queries/0_stateless/01448_json_compact_strings_each_row.reference index 0b05f050b29..fb1a066f272 100644 --- a/tests/queries/0_stateless/01448_json_compact_strings_each_row.reference +++ b/tests/queries/0_stateless/01448_json_compact_strings_each_row.reference @@ -24,16 +24,16 @@ ["first", "1", "2", "0"] ["second", "2", "0", "6"] 6 -["first", "1", "2", "0"] -["second", "2", "0", "6"] +["first", "1", "2", "8"] +["second", "2", "32", "6"] 7 ["16", "[15,16,17]", "['first','second','third']"] 8 ["first", "1", "2", "0"] ["second", "2", "0", "6"] 9 -["first", "1", "2", "0"] -["second", "2", "0", "6"] +["first", "1", "2", "8"] +["second", "2", "32", "6"] 10 ["first", "1", "16", "8"] ["second", "2", "32", "8"] From f528cd9f97b4f7c54a6c22406f09983d055ce642 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 13:01:12 +0300 Subject: [PATCH 072/341] Forward compiler version to unbundled build --- docker/packager/packager | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/packager/packager b/docker/packager/packager index 5874bedd17a..909f20acd6d 100755 --- a/docker/packager/packager +++ b/docker/packager/packager @@ -93,7 +93,7 @@ def parse_env_variables(build_type, compiler, sanitizer, package_type, image_typ cxx = cc.replace('gcc', 'g++').replace('clang', 'clang++') - if image_type == "deb": + if image_type == "deb" or image_type == "unbundled": result.append("DEB_CC={}".format(cc)) result.append("DEB_CXX={}".format(cxx)) elif image_type == "binary": From ca6b634eb0466361da6f3526a6611ab0ccd8bfc1 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 13:51:01 +0300 Subject: [PATCH 073/341] Install gcc-10 from proposed repo --- docker/packager/binary/Dockerfile | 13 +++++++++++-- docker/packager/deb/Dockerfile | 12 ++++++++++-- 2 files changed, 21 insertions(+), 4 deletions(-) diff --git a/docker/packager/binary/Dockerfile b/docker/packager/binary/Dockerfile index 45c35c2e0f3..b911b59a41d 100644 --- a/docker/packager/binary/Dockerfile +++ b/docker/packager/binary/Dockerfile @@ -32,8 +32,6 @@ RUN apt-get update \ curl \ gcc-9 \ g++-9 \ - gcc-10 \ - g++-10 \ llvm-${LLVM_VERSION} \ clang-${LLVM_VERSION} \ lld-${LLVM_VERSION} \ @@ -93,5 +91,16 @@ RUN wget -nv 
"https://developer.arm.com/-/media/Files/downloads/gnu-a/8.3-2019.0 # Download toolchain for FreeBSD 11.3 RUN wget -nv https://clickhouse-datasets.s3.yandex.net/toolchains/toolchains/freebsd-11.3-toolchain.tar.xz +# NOTE: For some reason we have outdated version of gcc-10 in ubuntu 20.04 stable. +# Current workaround is to use latest version proposed repo. Remove as soon as +# gcc-10.2 appear in stable repo. +RUN echo 'deb http://archive.ubuntu.com/ubuntu/ focal-proposed restricted main multiverse universe' > /etc/apt/sources.list.d/proposed-repositories.list + +RUN apt-get update \ + && apt-get install gcc-10 g++10 --yes + +RUN rm /etc/apt/sources.list.d/proposed-repositories.list + + COPY build.sh / CMD ["/bin/bash", "/build.sh"] diff --git a/docker/packager/deb/Dockerfile b/docker/packager/deb/Dockerfile index 87f4582f8e2..30334504c55 100644 --- a/docker/packager/deb/Dockerfile +++ b/docker/packager/deb/Dockerfile @@ -42,8 +42,6 @@ RUN export CODENAME="$(lsb_release --codename --short | tr 'A-Z' 'a-z')" \ # Libraries from OS are only needed to test the "unbundled" build (this is not used in production). RUN apt-get update \ && apt-get install \ - gcc-10 \ - g++-10 \ gcc-9 \ g++-9 \ clang-11 \ @@ -75,6 +73,16 @@ RUN apt-get update \ pigz \ --yes --no-install-recommends +# NOTE: For some reason we have outdated version of gcc-10 in ubuntu 20.04 stable. +# Current workaround is to use latest version proposed repo. Remove as soon as +# gcc-10.2 appear in stable repo. +RUN echo 'deb http://archive.ubuntu.com/ubuntu/ focal-proposed restricted main multiverse universe' > /etc/apt/sources.list.d/proposed-repositories.list + +RUN apt-get update \ + && apt-get install gcc-10 g++10 --yes --no-install-recommends + +RUN rm /etc/apt/sources.list.d/proposed-repositories.list + # This symlink required by gcc to find lld compiler RUN ln -s /usr/bin/lld-${LLVM_VERSION} /usr/bin/ld.lld From 150d8d4e79b0fff23cde361ed460e71c8729a4c5 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 14:11:59 +0300 Subject: [PATCH 074/341] Better recursive copy in integration tests --- tests/integration/helpers/cluster.py | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/tests/integration/helpers/cluster.py b/tests/integration/helpers/cluster.py index 6b8cdcf7989..44a22d3fe2e 100644 --- a/tests/integration/helpers/cluster.py +++ b/tests/integration/helpers/cluster.py @@ -1,6 +1,5 @@ import base64 import cassandra.cluster -import distutils.dir_util import docker import errno import httplib @@ -19,6 +18,7 @@ import socket import subprocess import time import urllib +import traceback import xml.dom.minidom from dicttoxml import dicttoxml from kazoo.client import KazooClient @@ -667,6 +667,7 @@ class ClickHouseCluster: except BaseException, e: print "Failed to start cluster: " print str(e) + print traceback.print_exc() raise def shutdown(self, kill=True): @@ -1164,10 +1165,10 @@ class ClickHouseInstance: db_dir = p.abspath(p.join(self.path, 'database')) print "Setup database dir {}".format(db_dir) - os.mkdir(db_dir) if self.clickhouse_path_dir is not None: print "Database files taken from {}".format(self.clickhouse_path_dir) - distutils.dir_util.copy_tree(self.clickhouse_path_dir, db_dir) + shutil.copytree(self.clickhouse_path_dir, db_dir) + print "Database copied from {} to {}".format(self.clickhouse_path_dir, db_dir) logs_dir = p.abspath(p.join(self.path, 'logs')) print "Setup logs dir {}".format(logs_dir) @@ -1228,7 +1229,6 @@ class ClickHouseInstance: binary_volume = "- " + 
self.server_bin_path + ":/usr/share/clickhouse_fresh" odbc_bridge_volume = "- " + self.odbc_bridge_bin_path + ":/usr/share/clickhouse-odbc-bridge_fresh" - with open(self.docker_compose_path, 'w') as docker_compose: docker_compose.write(DOCKER_COMPOSE_TEMPLATE.format( image=self.image, @@ -1251,8 +1251,8 @@ class ClickHouseInstance: app_net=app_net, ipv4_address=ipv4_address, ipv6_address=ipv6_address, - net_aliases = net_aliases, - net_alias1 = net_alias1, + net_aliases=net_aliases, + net_alias1=net_alias1, )) def destroy_dir(self): From 98f19a5d50b7c1a1017628f63813e6bbabb6a2e5 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 14:29:53 +0300 Subject: [PATCH 075/341] Better permissions --- .../clickhouse_path/format_schemas/rabbitmq.proto | 0 1 file changed, 0 insertions(+), 0 deletions(-) mode change 100644 => 100755 tests/integration/test_storage_rabbitmq/clickhouse_path/format_schemas/rabbitmq.proto diff --git a/tests/integration/test_storage_rabbitmq/clickhouse_path/format_schemas/rabbitmq.proto b/tests/integration/test_storage_rabbitmq/clickhouse_path/format_schemas/rabbitmq.proto old mode 100644 new mode 100755 From 97616f2982b6c334ac9894fc302686982e1f0213 Mon Sep 17 00:00:00 2001 From: Simon Podlipsky Date: Wed, 9 Sep 2020 13:33:34 +0200 Subject: [PATCH 076/341] Mention db requirement in dictionary functions --- docs/en/sql-reference/functions/ext-dict-functions.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/docs/en/sql-reference/functions/ext-dict-functions.md b/docs/en/sql-reference/functions/ext-dict-functions.md index 49b1c2dda2c..e0ecdd74fad 100644 --- a/docs/en/sql-reference/functions/ext-dict-functions.md +++ b/docs/en/sql-reference/functions/ext-dict-functions.md @@ -3,6 +3,9 @@ toc_priority: 58 toc_title: External Dictionaries --- +!!! attention "Attention" + `dict_name` parameter must be fully qualified for dictionaries created with DDL queries. Eg. `.`. + # Functions for Working with External Dictionaries {#ext_dict_functions} For information on connecting and configuring external dictionaries, see [External dictionaries](../../sql-reference/dictionaries/external-dictionaries/external-dicts.md). 
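A side note on the cluster.py change in PATCH 074/341 above: unlike distutils.dir_util.copy_tree, shutil.copytree creates the destination directory itself and raises if it already exists, which is why the unconditional os.mkdir(db_dir) call is dropped and the copy is only attempted when clickhouse_path_dir is set. Below is a minimal sketch of that setup logic; the helper name and signature are hypothetical, and the else branch that still creates an empty directory is an assumption (the actual diff simply removes the mkdir call).

import os
import shutil

def setup_database_dir(instance_path, clickhouse_path_dir=None):
    # Hypothetical helper mirroring the copy semantics used in cluster.py.
    db_dir = os.path.abspath(os.path.join(instance_path, 'database'))
    if clickhouse_path_dir is not None:
        # copytree creates db_dir and fails if it already exists, so the
        # directory must not be pre-created (distutils' copy_tree, by
        # contrast, merged files into an existing directory).
        shutil.copytree(clickhouse_path_dir, db_dir)
    else:
        # Assumed fallback for instances without a prepared database dir.
        os.mkdir(db_dir)
    return db_dir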
From c535d752438c9616dab8fac79bf8594acb44665a Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 14:47:34 +0300 Subject: [PATCH 077/341] Add update --- docker/packager/binary/Dockerfile | 2 +- docker/packager/deb/Dockerfile | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docker/packager/binary/Dockerfile b/docker/packager/binary/Dockerfile index b911b59a41d..893e9191b1e 100644 --- a/docker/packager/binary/Dockerfile +++ b/docker/packager/binary/Dockerfile @@ -99,7 +99,7 @@ RUN echo 'deb http://archive.ubuntu.com/ubuntu/ focal-proposed restricted main m RUN apt-get update \ && apt-get install gcc-10 g++10 --yes -RUN rm /etc/apt/sources.list.d/proposed-repositories.list +RUN rm /etc/apt/sources.list.d/proposed-repositories.list && apt-get update COPY build.sh / diff --git a/docker/packager/deb/Dockerfile b/docker/packager/deb/Dockerfile index 30334504c55..4b7c2ae53a4 100644 --- a/docker/packager/deb/Dockerfile +++ b/docker/packager/deb/Dockerfile @@ -81,7 +81,7 @@ RUN echo 'deb http://archive.ubuntu.com/ubuntu/ focal-proposed restricted main m RUN apt-get update \ && apt-get install gcc-10 g++10 --yes --no-install-recommends -RUN rm /etc/apt/sources.list.d/proposed-repositories.list +RUN rm /etc/apt/sources.list.d/proposed-repositories.list && apt-get update # This symlink required by gcc to find lld compiler RUN ln -s /usr/bin/lld-${LLVM_VERSION} /usr/bin/ld.lld From a8f5d9e70fef1202285eab1911f7aa794e0828f6 Mon Sep 17 00:00:00 2001 From: myrrc Date: Wed, 9 Sep 2020 15:52:44 +0300 Subject: [PATCH 078/341] added the test and comment --- src/Columns/ColumnLowCardinality.h | 4 ++++ .../0_stateless/01414_low_cardinality_nullable.reference | 1 + tests/queries/0_stateless/01414_low_cardinality_nullable.sql | 2 ++ 3 files changed, 7 insertions(+) diff --git a/src/Columns/ColumnLowCardinality.h b/src/Columns/ColumnLowCardinality.h index 00f58a133cf..0aeda4567fd 100644 --- a/src/Columns/ColumnLowCardinality.h +++ b/src/Columns/ColumnLowCardinality.h @@ -171,6 +171,10 @@ public: bool isNumeric() const override { return getDictionary().isNumeric(); } bool lowCardinality() const override { return true; } + /** + * Checks if the dictionary column is Nullable(T). + * So LC(Nullable(T)) would return true, LC(U) -- false. 
+ */ bool nestedIsNullable() const { return isColumnNullable(*dictionary.getColumnUnique().getNestedColumn()); } const IColumnUnique & getDictionary() const { return dictionary.getColumnUnique(); } diff --git a/tests/queries/0_stateless/01414_low_cardinality_nullable.reference b/tests/queries/0_stateless/01414_low_cardinality_nullable.reference index bf7b6cf4f76..51825f5cb76 100644 --- a/tests/queries/0_stateless/01414_low_cardinality_nullable.reference +++ b/tests/queries/0_stateless/01414_low_cardinality_nullable.reference @@ -80,3 +80,4 @@ 1 1 1 +2 diff --git a/tests/queries/0_stateless/01414_low_cardinality_nullable.sql b/tests/queries/0_stateless/01414_low_cardinality_nullable.sql index 6e311f9d519..9a554ead776 100644 --- a/tests/queries/0_stateless/01414_low_cardinality_nullable.sql +++ b/tests/queries/0_stateless/01414_low_cardinality_nullable.sql @@ -217,4 +217,6 @@ SELECT count() FROM lc_nullable WHERE has(date_time, toDateTime('1970-01-01 03:0 SELECT count() FROM lc_nullable WHERE has(str, '100'); SELECT count() FROM lc_nullable WHERE has(fixed_string, toFixedString('100', 5)); +SELECT count() FROM lc_nullable WHERE has(date, toDate(has(u64, 1), '1970-01\002')); + DROP TABLE IF EXISTS lc_nullable; From 956138635de536560d0843025720d7ce7b947cf3 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 15:59:26 +0300 Subject: [PATCH 079/341] Fix compiler name --- docker/packager/binary/Dockerfile | 2 +- docker/packager/deb/Dockerfile | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docker/packager/binary/Dockerfile b/docker/packager/binary/Dockerfile index 893e9191b1e..03bb3b5aefa 100644 --- a/docker/packager/binary/Dockerfile +++ b/docker/packager/binary/Dockerfile @@ -97,7 +97,7 @@ RUN wget -nv https://clickhouse-datasets.s3.yandex.net/toolchains/toolchains/fre RUN echo 'deb http://archive.ubuntu.com/ubuntu/ focal-proposed restricted main multiverse universe' > /etc/apt/sources.list.d/proposed-repositories.list RUN apt-get update \ - && apt-get install gcc-10 g++10 --yes + && apt-get install gcc-10 g++-10 --yes RUN rm /etc/apt/sources.list.d/proposed-repositories.list && apt-get update diff --git a/docker/packager/deb/Dockerfile b/docker/packager/deb/Dockerfile index 4b7c2ae53a4..a3c87f13fe4 100644 --- a/docker/packager/deb/Dockerfile +++ b/docker/packager/deb/Dockerfile @@ -79,7 +79,7 @@ RUN apt-get update \ RUN echo 'deb http://archive.ubuntu.com/ubuntu/ focal-proposed restricted main multiverse universe' > /etc/apt/sources.list.d/proposed-repositories.list RUN apt-get update \ - && apt-get install gcc-10 g++10 --yes --no-install-recommends + && apt-get install gcc-10 g++-10 --yes --no-install-recommends RUN rm /etc/apt/sources.list.d/proposed-repositories.list && apt-get update From b68782d285e5ea76f7318b55bf41cf337dfa71fc Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Wed, 9 Sep 2020 16:32:50 +0300 Subject: [PATCH 080/341] enable more tests with Atomic database --- docker/test/stress/stress | 2 +- programs/client/Client.cpp | 28 +++++++- src/Interpreters/DatabaseCatalog.cpp | 5 +- src/Interpreters/InterpreterCreateQuery.cpp | 1 + .../MergeTree/MergeTreeWriteAheadLog.cpp | 1 + src/Storages/StorageReplicatedMergeTree.cpp | 16 +++-- src/Storages/System/StorageSystemTables.cpp | 6 ++ .../queries/0_stateless/00116_storage_set.sql | 2 +- .../00180_attach_materialized_view.sql | 2 +- ...per_deduplication_and_unexpected_parts.sql | 2 +- .../00281_compile_sizeof_packed.re | 0 .../0_stateless/00311_array_primary_key.sql | 2 +- 
.../00423_storage_log_single_thread.sql | 6 +- .../00816_long_concurrent_alter_column.sh | 27 +++++--- .../01190_full_attach_syntax.reference | 13 ++++ .../0_stateless/01190_full_attach_syntax.sql | 66 +++++++++++++++++++ .../01305_replica_create_drop_zookeeper.sh | 20 ++++-- .../00065_loyalty_with_storage_join.sql | 2 +- tests/queries/skip_list.json | 33 +--------- 19 files changed, 172 insertions(+), 62 deletions(-) delete mode 100644 tests/queries/0_stateless/00281_compile_sizeof_packed.re create mode 100644 tests/queries/0_stateless/01190_full_attach_syntax.reference create mode 100644 tests/queries/0_stateless/01190_full_attach_syntax.sql diff --git a/docker/test/stress/stress b/docker/test/stress/stress index e8675da1546..60db5ec465c 100755 --- a/docker/test/stress/stress +++ b/docker/test/stress/stress @@ -28,7 +28,7 @@ def get_options(i): options = "" if 0 < i: options += " --order=random" - if i == 1: + if i % 2 == 1: options += " --atomic-db-engine" return options diff --git a/programs/client/Client.cpp b/programs/client/Client.cpp index c9701950dc5..83e4062b1f3 100644 --- a/programs/client/Client.cpp +++ b/programs/client/Client.cpp @@ -919,7 +919,33 @@ private: while (begin < end) { const char * pos = begin; - ASTPtr orig_ast = parseQuery(pos, end, true); + + ASTPtr orig_ast; + try + { + orig_ast = parseQuery(pos, end, true); + } + catch (Exception & e) + { + if (!test_mode) + throw; + + /// Try find test hint for syntax error + const char * end_of_line = find_first_symbols<'\n'>(begin, end); + TestHint hint(true, String(begin, end_of_line - begin)); + if (hint.serverError()) /// Syntax errors are considered as client errors + throw; + if (hint.clientError() != e.code()) + { + if (hint.clientError()) + e.addMessage("\nExpected clinet error: " + std::to_string(hint.clientError())); + throw; + } + + /// It's expected syntax error, skip the line + begin = end_of_line; + continue; + } if (!orig_ast) { diff --git a/src/Interpreters/DatabaseCatalog.cpp b/src/Interpreters/DatabaseCatalog.cpp index 6153f6b52fb..049341918b9 100644 --- a/src/Interpreters/DatabaseCatalog.cpp +++ b/src/Interpreters/DatabaseCatalog.cpp @@ -657,7 +657,10 @@ void DatabaseCatalog::enqueueDroppedTableCleanup(StorageID table_id, StoragePtr /// Table was removed from database. Enqueue removal of its data from disk. time_t drop_time; if (table) + { drop_time = std::chrono::system_clock::to_time_t(std::chrono::system_clock::now()); + table->is_dropped = true; + } else { /// Try load table from metadata to drop it correctly (e.g. remove metadata from zk or remove data from all volumes) @@ -674,6 +677,7 @@ void DatabaseCatalog::enqueueDroppedTableCleanup(StorageID table_id, StoragePtr try { table = createTableFromAST(*create, table_id.getDatabaseName(), data_path, *global_context, false).second; + table->is_dropped = true; } catch (...) { @@ -763,7 +767,6 @@ void DatabaseCatalog::dropTableFinally(const TableMarkedAsDropped & table) const if (table.table) { table.table->drop(); - table.table->is_dropped = true; } /// Even if table is not loaded, try remove its data from disk. 
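For reference, the docker/test/stress/stress hunk earlier in this patch enables the Atomic database engine on every odd-numbered stress runner instead of only runner 1, so roughly half of the parallel runs exercise Atomic databases. The touched function is reproduced here with added comments and a small usage note; the surrounding driver script is omitted.

def get_options(i):
    # Build extra command-line options for the i-th parallel stress run.
    options = ""
    if 0 < i:
        # Every runner except the first shuffles test order.
        options += " --order=random"
    if i % 2 == 1:
        # Previously only runner 1 got this flag; now all odd runners do.
        options += " --atomic-db-engine"
    return options

# Runners 0..3 would get: "", " --order=random --atomic-db-engine",
# " --order=random", " --order=random --atomic-db-engine".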
diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 06973ab029b..d7230940bb2 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -673,6 +673,7 @@ BlockIO InterpreterCreateQuery::createTable(ASTCreateQuery & create) create.attach_short_syntax = true; create.if_not_exists = if_not_exists; } + /// TODO maybe assert table structure if create.attach_short_syntax is false? if (!create.temporary && create.database.empty()) create.database = current_database; diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp index 53ef72f3208..3fa3a7e3e40 100644 --- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp +++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp @@ -66,6 +66,7 @@ void MergeTreeWriteAheadLog::dropPart(const String & part_name) writeIntBinary(static_cast(0), *out); writeIntBinary(static_cast(ActionType::DROP_PART), *out); writeStringBinary(part_name, *out); + out->next(); } void MergeTreeWriteAheadLog::rotate(const std::lock_guard &) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index 6058632d220..6458fe127da 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -4260,9 +4260,13 @@ bool StorageReplicatedMergeTree::waitForReplicaToProcessLogEntry( * To do this, check its node `log_pointer` - the maximum number of the element taken from `log` + 1. */ - const auto & check_replica_become_inactive = [this, &replica]() + bool waiting_itself = replica == replica_name; + + const auto & stop_waiting = [&]() { - return !getZooKeeper()->exists(zookeeper_path + "/replicas/" + replica + "/is_active"); + bool stop_waiting_itself = waiting_itself && is_dropped; + bool stop_waiting_non_active = !wait_for_non_active && !getZooKeeper()->exists(zookeeper_path + "/replicas/" + replica + "/is_active"); + return stop_waiting_itself || stop_waiting_non_active; }; constexpr auto event_wait_timeout_ms = 1000; @@ -4277,7 +4281,7 @@ bool StorageReplicatedMergeTree::waitForReplicaToProcessLogEntry( LOG_DEBUG(log, "Waiting for {} to pull {} to queue", replica, log_node_name); /// Let's wait until entry gets into the replica queue. - while (wait_for_non_active || !check_replica_become_inactive()) + while (!stop_waiting()) { zkutil::EventPtr event = std::make_shared(); @@ -4325,7 +4329,7 @@ bool StorageReplicatedMergeTree::waitForReplicaToProcessLogEntry( LOG_DEBUG(log, "Waiting for {} to pull {} to queue", replica, log_node_name); /// Let's wait until the entry gets into the replica queue. - while (wait_for_non_active || !check_replica_become_inactive()) + while (!stop_waiting()) { zkutil::EventPtr event = std::make_shared(); @@ -4378,10 +4382,8 @@ bool StorageReplicatedMergeTree::waitForReplicaToProcessLogEntry( /// Third - wait until the entry disappears from the replica queue or replica become inactive. 
String path_to_wait_on = zookeeper_path + "/replicas/" + replica + "/queue/" + queue_entry_to_wait_for; - if (wait_for_non_active) - return getZooKeeper()->waitForDisappear(path_to_wait_on); - return getZooKeeper()->waitForDisappear(path_to_wait_on, check_replica_become_inactive); + return getZooKeeper()->waitForDisappear(path_to_wait_on, stop_waiting); } diff --git a/src/Storages/System/StorageSystemTables.cpp b/src/Storages/System/StorageSystemTables.cpp index 5b7dad836e9..0ad961ad7d8 100644 --- a/src/Storages/System/StorageSystemTables.cpp +++ b/src/Storages/System/StorageSystemTables.cpp @@ -344,6 +344,12 @@ protected: { ASTPtr ast = database->tryGetCreateTableQuery(table_name, context); + if (ast && !context.getSettingsRef().show_table_uuid_in_table_create_query_if_not_nil) + { + auto & create = ast->as(); + create.uuid = UUIDHelpers::Nil; + } + if (columns_mask[src_index++]) res_columns[res_index++]->insert(ast ? queryToString(ast) : ""); diff --git a/tests/queries/0_stateless/00116_storage_set.sql b/tests/queries/0_stateless/00116_storage_set.sql index aa93a0620d0..0eeed7e859a 100644 --- a/tests/queries/0_stateless/00116_storage_set.sql +++ b/tests/queries/0_stateless/00116_storage_set.sql @@ -19,7 +19,7 @@ INSERT INTO set2 VALUES ('abc'), ('World'); SELECT arrayJoin(['Hello', 'test', 'World', 'world', 'abc', 'xyz']) AS s WHERE s IN set2; DETACH TABLE set2; -ATTACH TABLE set2 (x String) ENGINE = Set; +ATTACH TABLE set2; SELECT arrayJoin(['Hello', 'test', 'World', 'world', 'abc', 'xyz']) AS s WHERE s IN set2; diff --git a/tests/queries/0_stateless/00180_attach_materialized_view.sql b/tests/queries/0_stateless/00180_attach_materialized_view.sql index 089e4926bcf..d674c0bd277 100644 --- a/tests/queries/0_stateless/00180_attach_materialized_view.sql +++ b/tests/queries/0_stateless/00180_attach_materialized_view.sql @@ -6,7 +6,7 @@ CREATE TABLE t_00180 (x UInt8) ENGINE = Null; CREATE MATERIALIZED VIEW mv_00180 ENGINE = Null AS SELECT * FROM t_00180; DETACH TABLE mv_00180; -ATTACH MATERIALIZED VIEW mv_00180 ENGINE = Null AS SELECT * FROM t_00180; +ATTACH TABLE mv_00180; DROP TABLE t_00180; DROP TABLE mv_00180; diff --git a/tests/queries/0_stateless/00226_zookeeper_deduplication_and_unexpected_parts.sql b/tests/queries/0_stateless/00226_zookeeper_deduplication_and_unexpected_parts.sql index 623218af167..c14ce53d4a3 100644 --- a/tests/queries/0_stateless/00226_zookeeper_deduplication_and_unexpected_parts.sql +++ b/tests/queries/0_stateless/00226_zookeeper_deduplication_and_unexpected_parts.sql @@ -21,7 +21,7 @@ INSERT INTO deduplication (x) VALUES (1); SELECT * FROM deduplication; DETACH TABLE deduplication; -ATTACH TABLE deduplication (d Date DEFAULT '2015-01-01', x Int8) ENGINE = ReplicatedMergeTree('/clickhouse/tables/test_00226/deduplication', 'r1', d, x, 1); +ATTACH TABLE deduplication; SELECT * FROM deduplication; diff --git a/tests/queries/0_stateless/00281_compile_sizeof_packed.re b/tests/queries/0_stateless/00281_compile_sizeof_packed.re deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/tests/queries/0_stateless/00311_array_primary_key.sql b/tests/queries/0_stateless/00311_array_primary_key.sql index 0ea368609da..0e066c64f89 100644 --- a/tests/queries/0_stateless/00311_array_primary_key.sql +++ b/tests/queries/0_stateless/00311_array_primary_key.sql @@ -11,7 +11,7 @@ INSERT INTO array_pk VALUES ([5, 6], 'ghi', 6); SELECT * FROM array_pk ORDER BY n; DETACH TABLE array_pk; -ATTACH TABLE array_pk (key Array(UInt8), s String, n UInt64, d Date MATERIALIZED 
'2000-01-01') ENGINE = MergeTree(d, (key, s, n), 1); +ATTACH TABLE array_pk; SELECT * FROM array_pk ORDER BY n; diff --git a/tests/queries/0_stateless/00423_storage_log_single_thread.sql b/tests/queries/0_stateless/00423_storage_log_single_thread.sql index 7d5e14c9ee5..8eff9323564 100644 --- a/tests/queries/0_stateless/00423_storage_log_single_thread.sql +++ b/tests/queries/0_stateless/00423_storage_log_single_thread.sql @@ -5,7 +5,7 @@ SELECT * FROM log LIMIT 1; SELECT * FROM log; DETACH TABLE log; -ATTACH TABLE log (s String) ENGINE = Log; +ATTACH TABLE log; SELECT * FROM log; SELECT * FROM log LIMIT 1; @@ -15,13 +15,13 @@ INSERT INTO log VALUES ('Hello'), ('World'); SELECT * FROM log LIMIT 1; DETACH TABLE log; -ATTACH TABLE log (s String) ENGINE = Log; +ATTACH TABLE log; SELECT * FROM log LIMIT 1; SELECT * FROM log; DETACH TABLE log; -ATTACH TABLE log (s String) ENGINE = Log; +ATTACH TABLE log; SELECT * FROM log; SELECT * FROM log LIMIT 1; diff --git a/tests/queries/0_stateless/00816_long_concurrent_alter_column.sh b/tests/queries/0_stateless/00816_long_concurrent_alter_column.sh index 93421e003f6..8fdd6654bae 100755 --- a/tests/queries/0_stateless/00816_long_concurrent_alter_column.sh +++ b/tests/queries/0_stateless/00816_long_concurrent_alter_column.sh @@ -11,34 +11,34 @@ echo "CREATE TABLE concurrent_alter_column (ts DATETIME) ENGINE = MergeTree PART function thread1() { while true; do - for i in {1..500}; do echo "ALTER TABLE concurrent_alter_column ADD COLUMN c$i DOUBLE;"; done | ${CLICKHOUSE_CLIENT} -n --query_id=alter1 + for i in {1..500}; do echo "ALTER TABLE concurrent_alter_column ADD COLUMN c$i DOUBLE;"; done | ${CLICKHOUSE_CLIENT} -n --query_id=alter_00816_1 done } function thread2() { while true; do - echo "ALTER TABLE concurrent_alter_column ADD COLUMN d DOUBLE" | ${CLICKHOUSE_CLIENT} --query_id=alter2; + echo "ALTER TABLE concurrent_alter_column ADD COLUMN d DOUBLE" | ${CLICKHOUSE_CLIENT} --query_id=alter_00816_2; sleep "$(echo 0.0$RANDOM)"; - echo "ALTER TABLE concurrent_alter_column DROP COLUMN d" | ${CLICKHOUSE_CLIENT} --query_id=alter2; + echo "ALTER TABLE concurrent_alter_column DROP COLUMN d" | ${CLICKHOUSE_CLIENT} --query_id=alter_00816_2; done } function thread3() { while true; do - echo "ALTER TABLE concurrent_alter_column ADD COLUMN e DOUBLE" | ${CLICKHOUSE_CLIENT} --query_id=alter3; + echo "ALTER TABLE concurrent_alter_column ADD COLUMN e DOUBLE" | ${CLICKHOUSE_CLIENT} --query_id=alter_00816_3; sleep "$(echo 0.0$RANDOM)"; - echo "ALTER TABLE concurrent_alter_column DROP COLUMN e" | ${CLICKHOUSE_CLIENT} --query_id=alter3; + echo "ALTER TABLE concurrent_alter_column DROP COLUMN e" | ${CLICKHOUSE_CLIENT} --query_id=alter_00816_3; done } function thread4() { while true; do - echo "ALTER TABLE concurrent_alter_column ADD COLUMN f DOUBLE" | ${CLICKHOUSE_CLIENT} --query_id=alter4; + echo "ALTER TABLE concurrent_alter_column ADD COLUMN f DOUBLE" | ${CLICKHOUSE_CLIENT} --query_id=alter_00816_4; sleep "$(echo 0.0$RANDOM)"; - echo "ALTER TABLE concurrent_alter_column DROP COLUMN f" | ${CLICKHOUSE_CLIENT} --query_id=alter4; + echo "ALTER TABLE concurrent_alter_column DROP COLUMN f" | ${CLICKHOUSE_CLIENT} --query_id=alter_00816_4; done } @@ -57,9 +57,18 @@ timeout $TIMEOUT bash -c thread4 2> /dev/null & wait -echo "DROP TABLE concurrent_alter_column" | ${CLICKHOUSE_CLIENT} +echo "DROP TABLE concurrent_alter_column NO DELAY" | ${CLICKHOUSE_CLIENT} # NO DELAY has effect only for Atomic database + +db_engine=`$CLICKHOUSE_CLIENT -q "SELECT engine FROM system.databases WHERE 
name=currentDatabase()"` +if [[ $db_engine == "Atomic" ]]; then + # DROP is non-blocking, so wait for alters + while true; do + $CLICKHOUSE_CLIENT -q "SELECT c = 0 FROM (SELECT count() as c FROM system.processes WHERE query_id LIKE 'alter_00816_%')" | grep 1 > /dev/null && break; + sleep 1; + done +fi # Check for deadlocks -echo "SELECT * FROM system.processes WHERE query_id LIKE 'alter%'" | ${CLICKHOUSE_CLIENT} +echo "SELECT * FROM system.processes WHERE query_id LIKE 'alter_00816_%'" | ${CLICKHOUSE_CLIENT} echo 'did not crash' diff --git a/tests/queries/0_stateless/01190_full_attach_syntax.reference b/tests/queries/0_stateless/01190_full_attach_syntax.reference new file mode 100644 index 00000000000..619861849c8 --- /dev/null +++ b/tests/queries/0_stateless/01190_full_attach_syntax.reference @@ -0,0 +1,13 @@ +CREATE DICTIONARY test_01190.dict\n(\n `key` UInt64 DEFAULT 0,\n `col` UInt8 DEFAULT 1\n)\nPRIMARY KEY key\nSOURCE(CLICKHOUSE(HOST \'localhost\' PORT 9000 USER \'default\' TABLE \'table_for_dict\' PASSWORD \'\' DB \'test_01190\'))\nLIFETIME(MIN 1 MAX 10)\nLAYOUT(FLAT()) +CREATE DICTIONARY test_01190.dict\n(\n `key` UInt64 DEFAULT 0,\n `col` UInt8 DEFAULT 1\n)\nPRIMARY KEY key\nSOURCE(CLICKHOUSE(HOST \'localhost\' PORT 9000 USER \'default\' TABLE \'table_for_dict\' PASSWORD \'\' DB \'test_01190\'))\nLIFETIME(MIN 1 MAX 10)\nLAYOUT(FLAT()) +CREATE TABLE default.log\n(\n `s` String\n)\nENGINE = Log +CREATE TABLE default.log\n(\n `s` String\n)\nENGINE = Log() +test +CREATE TABLE default.mt\n(\n `key` Array(UInt8),\n `s` String,\n `n` UInt64,\n `d` Date MATERIALIZED \'2000-01-01\'\n)\nENGINE = MergeTree(d, (key, s, n), 1) +[1,2] Hello 2 +CREATE TABLE default.mt\n(\n `key` Array(UInt8),\n `s` String,\n `n` UInt64,\n `d` Date\n)\nENGINE = MergeTree(d, (key, s, n), 1) +CREATE MATERIALIZED VIEW default.mv\n(\n `s` String\n)\nENGINE = Null AS\nSELECT *\nFROM default.log +CREATE MATERIALIZED VIEW default.mv\n(\n `s` String\n)\nENGINE = Null AS\nSELECT *\nFROM default.log +CREATE MATERIALIZED VIEW default.mv\n(\n `key` Array(UInt8),\n `s` String,\n `n` UInt64,\n `d` Date\n)\nENGINE = Null AS\nSELECT *\nFROM default.mt +CREATE LIVE VIEW default.lv\n(\n `1` UInt8\n) AS\nSELECT 1 +CREATE LIVE VIEW default.lv\n(\n `1` UInt8\n) AS\nSELECT 1 diff --git a/tests/queries/0_stateless/01190_full_attach_syntax.sql b/tests/queries/0_stateless/01190_full_attach_syntax.sql new file mode 100644 index 00000000000..3a91eccc8cd --- /dev/null +++ b/tests/queries/0_stateless/01190_full_attach_syntax.sql @@ -0,0 +1,66 @@ +DROP DATABASE IF EXISTS test_01190; +CREATE DATABASE test_01190; + +CREATE TABLE test_01190.table_for_dict (key UInt64, col UInt8) ENGINE = Memory; + +CREATE DICTIONARY test_01190.dict (key UInt64 DEFAULT 0, col UInt8 DEFAULT 1) PRIMARY KEY key SOURCE(CLICKHOUSE(HOST 'localhost' PORT 9000 USER 'default' TABLE 'table_for_dict' PASSWORD '' DB 'test_01190')) LIFETIME(MIN 1 MAX 10) LAYOUT(FLAT()); + +SHOW CREATE DICTIONARY test_01190.dict; + +DETACH DICTIONARY test_01190.dict; +ATTACH TABLE test_01190.dict; -- { serverError 80 } +-- Full ATTACH syntax is not allowed for dictionaries +ATTACH DICTIONARY test_01190.dict (key UInt64 DEFAULT 0, col UInt8 DEFAULT 42) PRIMARY KEY key SOURCE(CLICKHOUSE(HOST 'localhost' PORT 9000 USER 'default' TABLE 'table_for_dict' PASSWORD '' DB 'test_01190')) LIFETIME(MIN 1 MAX 100) LAYOUT(FLAT()); -- { clientError 62 } +ATTACH DICTIONARY test_01190.dict; +SHOW CREATE DICTIONARY test_01190.dict; + +DROP DATABASE test_01190; + + +DROP TABLE IF EXISTS log; +DROP TABLE IF 
EXISTS mt; +DROP TABLE IF EXISTS mv; +DROP TABLE IF EXISTS lv; + +CREATE TABLE log ENGINE = Log AS SELECT 'test' AS s; +SHOW CREATE log; +DETACH TABLE log; +ATTACH DICTIONARY log; -- { serverError 487 } +ATTACH TABLE log (s String) ENGINE = Log(); +SHOW CREATE log; +SELECT * FROM log; + +DROP TABLE IF EXISTS mt; +CREATE TABLE mt (key Array(UInt8), s String, n UInt64, d Date MATERIALIZED '2000-01-01') ENGINE = MergeTree(d, (key, s, n), 1); +INSERT INTO mt VALUES ([1, 2], 'Hello', 2); +DETACH TABLE mt; +ATTACH TABLE mt (key Array(UInt8), s String, n UInt64, d Date MATERIALIZED '2000-01-01') ENGINE = MergeTree ORDER BY (key, s, n) PARTITION BY toYYYYMM(d); -- { serverError 342 } +ATTACH TABLE mt (key Array(UInt8), s String, n UInt64, d Date MATERIALIZED '2000-01-01') ENGINE = MergeTree(d, (key, s, n), 1); +SHOW CREATE mt; +SELECT * FROM mt; +DETACH TABLE mt; +ATTACH TABLE mt (key Array(UInt8), s String, n UInt64, d Date) ENGINE = MergeTree(d, (key, s, n), 1); -- It works (with Ordinary database), but probably it shouldn't +SHOW CREATE mt; + +CREATE MATERIALIZED VIEW mv ENGINE = Null AS SELECT * FROM log; +SHOW CREATE mv; +DETACH VIEW mv; +ATTACH MATERIALIZED VIEW mv ENGINE = Null AS SELECT * FROM log; +SHOW CREATE mv; +DETACH VIEW mv; +ATTACH MATERIALIZED VIEW mv ENGINE = Null AS SELECT * FROM mt; -- It works (with Ordinary database), but probably it shouldn't +SHOW CREATE mv; + +SET allow_experimental_live_view = 1; +CREATE LIVE VIEW lv AS SELECT 1; +SHOW CREATE lv; +DETACH VIEW lv; +ATTACH LIVE VIEW lv AS SELECT 1; +SHOW CREATE lv; + +DROP TABLE log; +DROP TABLE mt; +DROP TABLE mv; +DROP TABLE lv; + + diff --git a/tests/queries/0_stateless/01305_replica_create_drop_zookeeper.sh b/tests/queries/0_stateless/01305_replica_create_drop_zookeeper.sh index 0a47c6df46c..1313830d589 100755 --- a/tests/queries/0_stateless/01305_replica_create_drop_zookeeper.sh +++ b/tests/queries/0_stateless/01305_replica_create_drop_zookeeper.sh @@ -7,11 +7,21 @@ set -e function thread() { - while true; do - $CLICKHOUSE_CLIENT -n -q "DROP TABLE IF EXISTS test_table_$1; - CREATE TABLE test_table_$1 (a UInt8) ENGINE = ReplicatedMergeTree('/clickhouse/tables/test_01305/alter_table', 'r_$1') ORDER BY tuple();" 2>&1 | - grep -vP '(^$)|(^Received exception from server)|(^\d+\. )|because the last replica of the table was dropped right now|is already started to be removing by another replica right now|is already finished removing by another replica right now|Removing leftovers from table|Another replica was suddenly created|was successfully removed from ZooKeeper|was created by another server at the same moment|was suddenly removed|some other replicas were created at the same time' - done + db_engine=`$CLICKHOUSE_CLIENT -q "SELECT engine FROM system.databases WHERE name=currentDatabase()"` + if [[ $db_engine == "Atomic" ]]; then + # Ignore "Replica already exists" exception + while true; do + $CLICKHOUSE_CLIENT -n -q "DROP TABLE IF EXISTS test_table_$1 NO DELAY; + CREATE TABLE test_table_$1 (a UInt8) ENGINE = ReplicatedMergeTree('/clickhouse/tables/test_01305/alter_table', 'r_$1') ORDER BY tuple();" 2>&1 | + grep -vP '(^$)|(^Received exception from server)|(^\d+\. 
)|because the last replica of the table was dropped right now|is already started to be removing by another replica right now|is already finished removing by another replica right now|Removing leftovers from table|Another replica was suddenly created|was successfully removed from ZooKeeper|was created by another server at the same moment|was suddenly removed|some other replicas were created at the same time|already exists' + done + else + while true; do + $CLICKHOUSE_CLIENT -n -q "DROP TABLE IF EXISTS test_table_$1; + CREATE TABLE test_table_$1 (a UInt8) ENGINE = ReplicatedMergeTree('/clickhouse/tables/test_01305/alter_table', 'r_$1') ORDER BY tuple();" 2>&1 | + grep -vP '(^$)|(^Received exception from server)|(^\d+\. )|because the last replica of the table was dropped right now|is already started to be removing by another replica right now|is already finished removing by another replica right now|Removing leftovers from table|Another replica was suddenly created|was successfully removed from ZooKeeper|was created by another server at the same moment|was suddenly removed|some other replicas were created at the same time' + done + fi } diff --git a/tests/queries/1_stateful/00065_loyalty_with_storage_join.sql b/tests/queries/1_stateful/00065_loyalty_with_storage_join.sql index 15a2a75cf58..515a2410583 100644 --- a/tests/queries/1_stateful/00065_loyalty_with_storage_join.sql +++ b/tests/queries/1_stateful/00065_loyalty_with_storage_join.sql @@ -22,7 +22,7 @@ GROUP BY loyalty ORDER BY loyalty ASC; DETACH TABLE join; -ATTACH TABLE join (UserID UInt64, loyalty Int8) ENGINE = Join(SEMI, LEFT, UserID); +ATTACH TABLE join; SELECT loyalty, diff --git a/tests/queries/skip_list.json b/tests/queries/skip_list.json index adfc5f0e582..efd622402b2 100644 --- a/tests/queries/skip_list.json +++ b/tests/queries/skip_list.json @@ -3,10 +3,8 @@ */ { "thread-sanitizer": [ - "00281", "00877", "00985", - "avx2", "query_profiler", "memory_profiler", /// 01083 and 00505 and 00505 are critical and temproray disabled @@ -21,9 +19,7 @@ "01193_metadata_loading" ], "address-sanitizer": [ - "00281", "00877", - "avx2", "query_profiler", "memory_profiler", "odbc_roundtrip", @@ -31,9 +27,7 @@ "01193_metadata_loading" ], "ub-sanitizer": [ - "00281", "capnproto", - "avx2", "query_profiler", "memory_profiler", "01103_check_cpu_instructions_at_startup", @@ -41,9 +35,7 @@ "01193_metadata_loading" ], "memory-sanitizer": [ - "00281", "capnproto", - "avx2", "query_profiler", "memory_profiler", "01103_check_cpu_instructions_at_startup", @@ -53,8 +45,6 @@ "01193_metadata_loading" ], "debug-build": [ - "00281", - "avx2", "query_profiler", "memory_profiler", "00899_long_attach", @@ -70,12 +60,10 @@ ], "unbundled-build": [ "00429", - "00428", "00877", "pocopatch", "parquet", "xxhash", - "avx2", "_h3", "query_profiler", "memory_profiler", @@ -98,33 +86,19 @@ "01455_time_zones" ], "release-build": [ - "avx2" ], "database-atomic": [ - "00065_loyalty_with_storage_join", - "avx", /// Inner tables of materialized views have different names "00738_lock_for_inner_table", - "00699_materialized_view_mutations", "00609_mv_index_in_in", "00510_materizlized_view_and_deduplication_zookeeper", - /// Create queries contain UUID + /// Different database engine "00604_show_create_database", - "00080_show_tables_and_system_tables", - "01272_suspicious_codecs", /// UUID must be specified in ATTACH TABLE - "01249_bad_arguments_for_bloom_filter", - "00423_storage_log_single_thread", - "00311_array_primary_key", - 
"00226_zookeeper_deduplication_and_unexpected_parts", - "00180_attach_materialized_view", - "00116_storage_set", + "01190_full_attach_syntax", /// Assumes blocking DROP - "00816_long_concurrent_alter_column", - "00992_system_parts_race_condition_zookeeper", /// FIXME "01320_create_sync_race_condition", - "01305_replica_create_drop_zookeeper", - "01130_in_memory_parts_partitons", + /// Internal distionary name is different "01225_show_create_table_from_dictionary", "01224_no_superfluous_dict_reload" ], @@ -132,7 +106,6 @@ /// These tests fail with compact parts, because they /// check some implementation defined things /// like checksums, computed granularity, ProfileEvents, etc. - "avx", "01045_order_by_pk_special_storages", "01042_check_query_and_last_granule_size", "00961_checksums_in_system_parts_columns_table", From 83ec93dec868a1e17950f6298b5ec1ce0d5352db Mon Sep 17 00:00:00 2001 From: Alexander Kuzmenkov Date: Wed, 9 Sep 2020 16:46:59 +0300 Subject: [PATCH 081/341] Fuzzer: reset default database before reconnect --- programs/client/Client.cpp | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/programs/client/Client.cpp b/programs/client/Client.cpp index c9701950dc5..99598c70397 100644 --- a/programs/client/Client.cpp +++ b/programs/client/Client.cpp @@ -866,6 +866,8 @@ private: // will exit. The ping() would be the best match here, but it's // private, probably for a good reason that the protocol doesn't allow // pings at any possible moment. + // Don't forget to reset the default database which might have changed. + connection->setDefaultDatabase(""); connection->forceConnected(connection_parameters.timeouts); if (text.size() > 4 * 1024) @@ -1103,7 +1105,9 @@ private: { last_exception_received_from_server = std::make_unique(getCurrentExceptionMessage(true), getCurrentExceptionCode()); received_exception_from_server = true; - std::cerr << "Error on processing query: " << ast_to_process->formatForErrorMessage() << std::endl << last_exception_received_from_server->message(); + fmt::print(stderr, "Error on processing query '{}': {}\n", + ast_to_process->formatForErrorMessage(), + last_exception_received_from_server->message()); } if (!connection->isConnected()) From 50dee3f4493d7ffb2c75d195cc39862f8f8d8a86 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 17:43:17 +0300 Subject: [PATCH 082/341] Remove false-positive warning --- src/Storages/MergeTree/MergeTreePartition.cpp | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/Storages/MergeTree/MergeTreePartition.cpp b/src/Storages/MergeTree/MergeTreePartition.cpp index 4a846f63b7c..8ef3e458871 100644 --- a/src/Storages/MergeTree/MergeTreePartition.cpp +++ b/src/Storages/MergeTree/MergeTreePartition.cpp @@ -29,6 +29,9 @@ String MergeTreePartition::getID(const MergeTreeData & storage) const return getID(storage.getInMemoryMetadataPtr()->getPartitionKey().sample_block); } +#pragma GCC diagnostic push +#pragma GCC diagnostic ignored "-Wstringop-overflow" + /// NOTE: This ID is used to create part names which are then persisted in ZK and as directory names on the file system. /// So if you want to change this method, be sure to guarantee compatibility with existing table data. 
String MergeTreePartition::getID(const Block & partition_key_sample) const @@ -87,6 +90,8 @@ String MergeTreePartition::getID(const Block & partition_key_sample) const return result; } +#pragma GCC diagnostic pop + void MergeTreePartition::serializeText(const MergeTreeData & storage, WriteBuffer & out, const FormatSettings & format_settings) const { auto metadata_snapshot = storage.getInMemoryMetadataPtr(); From 673244876ea15008b54bf93e9d535a0a65e68696 Mon Sep 17 00:00:00 2001 From: Mikhail Cheshkov Date: Wed, 9 Sep 2020 17:57:15 +0300 Subject: [PATCH 083/341] Use global ICU ADDINCL for Arcadia build --- src/Columns/ya.make | 2 -- src/Functions/ya.make | 1 - src/Functions/ya.make.in | 1 - 3 files changed, 4 deletions(-) diff --git a/src/Columns/ya.make b/src/Columns/ya.make index 78c0e1b992d..910c479c2a9 100644 --- a/src/Columns/ya.make +++ b/src/Columns/ya.make @@ -2,8 +2,6 @@ LIBRARY() ADDINCL( - contrib/libs/icu/common - contrib/libs/icu/i18n contrib/libs/pdqsort ) diff --git a/src/Functions/ya.make b/src/Functions/ya.make index b9a7b5b64ea..f48b4d607ed 100644 --- a/src/Functions/ya.make +++ b/src/Functions/ya.make @@ -10,7 +10,6 @@ ADDINCL( contrib/libs/farmhash contrib/libs/h3/h3lib/include contrib/libs/hyperscan/src - contrib/libs/icu/common contrib/libs/libdivide contrib/libs/rapidjson/include contrib/libs/xxhash diff --git a/src/Functions/ya.make.in b/src/Functions/ya.make.in index a5a54d94c6c..2a66aa5553e 100644 --- a/src/Functions/ya.make.in +++ b/src/Functions/ya.make.in @@ -9,7 +9,6 @@ ADDINCL( contrib/libs/farmhash contrib/libs/h3/h3lib/include contrib/libs/hyperscan/src - contrib/libs/icu/common contrib/libs/libdivide contrib/libs/rapidjson/include contrib/libs/xxhash From 7f4106687cb14491246f218654ed8a0a3b751b29 Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Wed, 9 Sep 2020 19:23:31 +0300 Subject: [PATCH 084/341] fix --- tests/queries/0_stateless/01114_database_atomic.reference | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/01114_database_atomic.reference b/tests/queries/0_stateless/01114_database_atomic.reference index 7980819f9af..a79784230a6 100644 --- a/tests/queries/0_stateless/01114_database_atomic.reference +++ b/tests/queries/0_stateless/01114_database_atomic.reference @@ -7,7 +7,7 @@ test_01114_3 Ordinary test_01114_3 test_01114_3 1 20 100 CREATE TABLE test_01114_2.mt UUID \'00001114-0000-4000-8000-000000000002\'\n(\n `n` UInt64\n)\nENGINE = MergeTree()\nPARTITION BY n % 5\nORDER BY tuple()\nSETTINGS index_granularity = 8192 -mt 00001114-0000-4000-8000-000000000002 CREATE TABLE test_01114_2.mt UUID \'00001114-0000-4000-8000-000000000002\' (`n` UInt64) ENGINE = MergeTree() PARTITION BY n % 5 ORDER BY tuple() SETTINGS index_granularity = 8192 +mt 00001114-0000-4000-8000-000000000002 CREATE TABLE test_01114_2.mt (`n` UInt64) ENGINE = MergeTree() PARTITION BY n % 5 ORDER BY tuple() SETTINGS index_granularity = 8192 20 CREATE TABLE test_01114_1.mt UUID \'00001114-0000-4000-8000-000000000001\'\n(\n `n` UInt64\n)\nENGINE = MergeTree()\nPARTITION BY n % 5\nORDER BY tuple()\nSETTINGS index_granularity = 8192 CREATE TABLE test_01114_2.mt UUID \'00001114-0000-4000-8000-000000000002\'\n(\n `n` UInt64\n)\nENGINE = MergeTree()\nPARTITION BY n % 5\nORDER BY tuple()\nSETTINGS index_granularity = 8192 From d1d3af7501a35629d48b046387dfb95e0731f657 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Wed, 9 Sep 2020 00:22:24 -0700 Subject: [PATCH 085/341] StorageReplicatedMergeTree - more improvements to integration test --- 
.../__init__.py | 0 .../test.py | 24 +++++++------------ 2 files changed, 9 insertions(+), 15 deletions(-) rename tests/integration/{test_replicated_zk_conn_failure => test_cleanup_dir_after_bad_zk_conn}/__init__.py (100%) rename tests/integration/{test_replicated_zk_conn_failure => test_cleanup_dir_after_bad_zk_conn}/test.py (63%) diff --git a/tests/integration/test_replicated_zk_conn_failure/__init__.py b/tests/integration/test_cleanup_dir_after_bad_zk_conn/__init__.py similarity index 100% rename from tests/integration/test_replicated_zk_conn_failure/__init__.py rename to tests/integration/test_cleanup_dir_after_bad_zk_conn/__init__.py diff --git a/tests/integration/test_replicated_zk_conn_failure/test.py b/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py similarity index 63% rename from tests/integration/test_replicated_zk_conn_failure/test.py rename to tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py index a860716ee82..ef31e8487be 100644 --- a/tests/integration/test_replicated_zk_conn_failure/test.py +++ b/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py @@ -9,12 +9,12 @@ from helpers.network import PartitionManager # Test flow is as follows: # 1. Configure cluster with ZooKeeper and create a database. # 2. Drop all connections to ZooKeeper. -# 3. Try creating the table and there would be a Poco:Exception. +# 3. Try creating the table and there will be a Poco:Exception. # 4. Try creating the table again and there should not be any error -# that indicates that the Directory for table already exists. +# that indicates that the directory for table already exists. # 5. Final step is to restore ZooKeeper connection and verify that -# the table creation and queries work. -def test_replicated_zk_conn_failure(): +# the table creation works. +def test_cleanup_dir_after_bad_zk_conn(): cluster = ClickHouseCluster(__file__) node1 = cluster.add_instance('node1', with_zookeeper=True) try: @@ -30,21 +30,15 @@ def test_replicated_zk_conn_failure(): ORDER BY id;''' with PartitionManager() as pm: pm.drop_instance_zk_connections(node1) - time.sleep(5) + time.sleep(3) error = node1.query_and_get_error(query_create) - # Assert that there was net exception. - assert "Poco::Exception. Code: 1000" in error - # Assert that the exception was due to ZooKeeper connectivity. - assert "All connection tries failed while connecting to ZooKeeper" in error - # retry table creation + assert "Poco::Exception. Code: 1000" and \ + "All connection tries failed while connecting to ZooKeeper" in error error = node1.query_and_get_error(query_create) - # Should not expect any errors related to directory already existing - # and those should have been already cleaned up during the previous retry. assert "Directory for table data data/replica/test/ already exists" not in error - # restore ZooKeeper connections. pm.restore_instance_zk_connections(node1) - # retry create query and query the table created. 
node1.query(query_create) - assert "0\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') + node1.query('''INSERT INTO replica.test VALUES (1, now())''') + assert "1\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') finally: cluster.shutdown() From 62428845a0fdcaaa19ecc5fd33f3ecd849104cf5 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 19:47:06 +0300 Subject: [PATCH 086/341] Bug in mutation --- src/Columns/ColumnVector.h | 7 ++++--- .../0_stateless/01475_mutation_with_if.reference | 1 + .../0_stateless/01475_mutation_with_if.sql | 16 ++++++++++++++++ 3 files changed, 21 insertions(+), 3 deletions(-) create mode 100644 tests/queries/0_stateless/01475_mutation_with_if.reference create mode 100644 tests/queries/0_stateless/01475_mutation_with_if.sql diff --git a/src/Columns/ColumnVector.h b/src/Columns/ColumnVector.h index 1090de556a0..55ab67d6214 100644 --- a/src/Columns/ColumnVector.h +++ b/src/Columns/ColumnVector.h @@ -7,6 +7,7 @@ #include #include #include +#include namespace DB @@ -130,7 +131,7 @@ public: void insertFrom(const IColumn & src, size_t n) override { - data.push_back(static_cast(src).getData()[n]); + data.push_back(assert_cast(src).getData()[n]); } void insertData(const char * pos, size_t) override @@ -205,14 +206,14 @@ public: /// This method implemented in header because it could be possibly devirtualized. int compareAt(size_t n, size_t m, const IColumn & rhs_, int nan_direction_hint) const override { - return CompareHelper::compare(data[n], static_cast(rhs_).data[m], nan_direction_hint); + return CompareHelper::compare(data[n], assert_cast(rhs_).data[m], nan_direction_hint); } void compareColumn(const IColumn & rhs, size_t rhs_row_num, PaddedPODArray * row_indexes, PaddedPODArray & compare_results, int direction, int nan_direction_hint) const override { - return this->template doCompareColumn(static_cast(rhs), rhs_row_num, row_indexes, + return this->template doCompareColumn(assert_cast(rhs), rhs_row_num, row_indexes, compare_results, direction, nan_direction_hint); } diff --git a/tests/queries/0_stateless/01475_mutation_with_if.reference b/tests/queries/0_stateless/01475_mutation_with_if.reference new file mode 100644 index 00000000000..2874a18147f --- /dev/null +++ b/tests/queries/0_stateless/01475_mutation_with_if.reference @@ -0,0 +1 @@ +1 150 diff --git a/tests/queries/0_stateless/01475_mutation_with_if.sql b/tests/queries/0_stateless/01475_mutation_with_if.sql new file mode 100644 index 00000000000..6f0ef8924be --- /dev/null +++ b/tests/queries/0_stateless/01475_mutation_with_if.sql @@ -0,0 +1,16 @@ +DROP TABLE IF EXISTS mutation_table; +CREATE TABLE mutation_table ( + id int, + price Nullable(Int32) +) +ENGINE = MergeTree() +PARTITION BY id +ORDER BY id; + +INSERT INTO mutation_table (id, price) VALUES (1, 100); + +ALTER TABLE mutation_table UPDATE price = 150 WHERE id = 1 SETTINGS mutations_sync = 2; + +SELECT * FROM mutation_table; + +DROP TABLE IF EXISTS mutation_table; From 9fa04cf48b1f2aa9288dbd026e37b7aae9e8a6f3 Mon Sep 17 00:00:00 2001 From: Peng Jian Date: Thu, 10 Sep 2020 00:59:38 +0800 Subject: [PATCH 087/341] Add QueryMemoryLimitExceeded event --- src/Common/MemoryTracker.cpp | 7 +++++++ src/Common/ProfileEvents.cpp | 1 + 2 files changed, 8 insertions(+) diff --git a/src/Common/MemoryTracker.cpp b/src/Common/MemoryTracker.cpp index 9d073cf8dd8..5d51fc9f301 100644 --- a/src/Common/MemoryTracker.cpp +++ b/src/Common/MemoryTracker.cpp @@ -6,6 +6,7 @@ #include #include #include +#include #include #include @@ 
-22,6 +23,10 @@ namespace DB } } +namespace ProfileEvents +{ + extern const Event QueryMemoryLimitExceeded; +} static constexpr size_t log_peak_memory_usage_every = 1ULL << 30; @@ -104,6 +109,7 @@ void MemoryTracker::alloc(Int64 size) /// Prevent recursion. Exception::ctor -> std::string -> new[] -> MemoryTracker::alloc auto untrack_lock = blocker.cancel(); // NOLINT + ProfileEvents::increment(ProfileEvents::QueryMemoryLimitExceeded); std::stringstream message; message << "Memory tracker"; if (const auto * description = description_ptr.load(std::memory_order_relaxed)) @@ -136,6 +142,7 @@ void MemoryTracker::alloc(Int64 size) /// Prevent recursion. Exception::ctor -> std::string -> new[] -> MemoryTracker::alloc auto no_track = blocker.cancel(); // NOLINT + ProfileEvents::increment(ProfileEvents::QueryMemoryLimitExceeded); std::stringstream message; message << "Memory limit"; if (const auto * description = description_ptr.load(std::memory_order_relaxed)) diff --git a/src/Common/ProfileEvents.cpp b/src/Common/ProfileEvents.cpp index 475e073d253..c9ff9642361 100644 --- a/src/Common/ProfileEvents.cpp +++ b/src/Common/ProfileEvents.cpp @@ -233,6 +233,7 @@ M(S3WriteRequestsErrors, "Number of non-throttling errors in POST, DELETE, PUT and PATCH requests to S3 storage.") \ M(S3WriteRequestsThrottling, "Number of 429 and 503 errors in POST, DELETE, PUT and PATCH requests to S3 storage.") \ M(S3WriteRequestsRedirects, "Number of redirects in POST, DELETE, PUT and PATCH requests to S3 storage.") \ + M(QueryMemoryLimitExceeded, "Number of times of memory limit exceeded for query.") \ namespace ProfileEvents From dee1fefeb472bebdfa4e15eb1b7ec7e428069f8a Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Wed, 9 Sep 2020 20:39:49 +0300 Subject: [PATCH 088/341] add more tests --- src/Storages/StorageReplicatedMergeTree.cpp | 5 +- .../test.py | 74 ++++++++++++------- 2 files changed, 50 insertions(+), 29 deletions(-) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index a1027a8be53..00dcc7aeb08 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -612,7 +612,10 @@ bool StorageReplicatedMergeTree::createTableIfNotExists(const StorageMetadataPtr return true; } - throw Exception("Cannot create table, because it is created concurrently every time or because of logical error", ErrorCodes::LOGICAL_ERROR); + /// Do not use LOGICAL_ERROR code, because it may happen if user has specified wrong zookeeper_path + throw Exception("Cannot create table, because it is created concurrently every time " + "or because of wrong zookeeper_path " + "or because of logical error", ErrorCodes::REPLICA_IS_ALREADY_EXIST); } void StorageReplicatedMergeTree::createReplica(const StorageMetadataPtr & metadata_snapshot) diff --git a/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py b/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py index ef31e8487be..4cb243160a0 100644 --- a/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py +++ b/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py @@ -1,9 +1,21 @@ import time +import pytest from helpers.cluster import ClickHouseCluster from helpers.network import PartitionManager +cluster = ClickHouseCluster(__file__) +node1 = cluster.add_instance('node1', with_zookeeper=True) + +@pytest.fixture(scope="module") +def start_cluster(): + try: + cluster.start() + yield cluster + finally: + cluster.shutdown() + # This tests if the data directory for a 
table is cleaned up if there is a Zookeeper # connection exception during a CreateQuery operation involving ReplicatedMergeTree tables. # Test flow is as follows: @@ -14,31 +26,37 @@ from helpers.network import PartitionManager # that indicates that the directory for table already exists. # 5. Final step is to restore ZooKeeper connection and verify that # the table creation works. -def test_cleanup_dir_after_bad_zk_conn(): - cluster = ClickHouseCluster(__file__) - node1 = cluster.add_instance('node1', with_zookeeper=True) - try: - cluster.start() - node1.query("CREATE DATABASE replica;") - query_create = '''CREATE TABLE replica.test - ( - id Int64, - event_time DateTime - ) - Engine=ReplicatedMergeTree('/clickhouse/tables/replica/test', 'node1') - PARTITION BY toYYYYMMDD(event_time) - ORDER BY id;''' - with PartitionManager() as pm: - pm.drop_instance_zk_connections(node1) - time.sleep(3) - error = node1.query_and_get_error(query_create) - assert "Poco::Exception. Code: 1000" and \ - "All connection tries failed while connecting to ZooKeeper" in error - error = node1.query_and_get_error(query_create) - assert "Directory for table data data/replica/test/ already exists" not in error - pm.restore_instance_zk_connections(node1) - node1.query(query_create) - node1.query('''INSERT INTO replica.test VALUES (1, now())''') - assert "1\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') - finally: - cluster.shutdown() +def test_cleanup_dir_after_bad_zk_conn(start_cluster): + node1.query("CREATE DATABASE replica;") + query_create = '''CREATE TABLE replica.test + ( + id Int64, + event_time DateTime + ) + Engine=ReplicatedMergeTree('/clickhouse/tables/replica/test', 'node1') + PARTITION BY toYYYYMMDD(event_time) + ORDER BY id;''' + with PartitionManager() as pm: + pm.drop_instance_zk_connections(node1) + time.sleep(3) + error = node1.query_and_get_error(query_create) + assert "Poco::Exception. 
Code: 1000" and \ + "All connection tries failed while connecting to ZooKeeper" in error + error = node1.query_and_get_error(query_create) + assert "Directory for table data data/replica/test/ already exists" not in error + node1.query(query_create) + node1.query('''INSERT INTO replica.test VALUES (1, now())''') + assert "1\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') + +def test_cleanup_dir_after_wrong_replica_name(start_cluster): + node1.query("CREATE TABLE test2_r1 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test2/', 'r1') ORDER BY n") + error = node1.query_and_get_error("CREATE TABLE test2_r2 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test2/', 'r1') ORDER BY n") + assert "already exists" in error + node1.query("CREATE TABLE test_r2 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test2/', 'r2') ORDER BY n") + + +def test_cleanup_dir_after_wrong_zk_path(start_cluster): + node1.query("CREATE TABLE test3_r1 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test3/', 'r1') ORDER BY n") + error = node1.query_and_get_error("CREATE TABLE test3_r2 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/', 'r2') ORDER BY n") + assert "Cannot create" in error + node1.query("CREATE TABLE test3_r2 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test3/', 'r2') ORDER BY n") From 7304bad56fff15882c82a556a4bd8b197c65092b Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 9 Sep 2020 20:51:05 +0300 Subject: [PATCH 089/341] Support for nested multiline comments --- src/Parsers/Lexer.cpp | 20 +++++++++++++++---- .../01491_nested_multiline_comments.reference | 3 +++ .../01491_nested_multiline_comments.sql | 3 +++ 3 files changed, 22 insertions(+), 4 deletions(-) create mode 100644 tests/queries/0_stateless/01491_nested_multiline_comments.reference create mode 100644 tests/queries/0_stateless/01491_nested_multiline_comments.sql diff --git a/src/Parsers/Lexer.cpp b/src/Parsers/Lexer.cpp index baf547a0a1a..ffa8250a3f3 100644 --- a/src/Parsers/Lexer.cpp +++ b/src/Parsers/Lexer.cpp @@ -253,15 +253,27 @@ Token Lexer::nextTokenImpl() else { ++pos; + + /// Nested multiline comments are supported according to the SQL standard. + size_t nesting_level = 1; + while (pos + 2 <= end) { - /// This means that nested multiline comments are not supported. 
- if (pos[0] == '*' && pos[1] == '/') + if (pos[0] == '/' && pos[1] == '*') { pos += 2; - return Token(TokenType::Comment, token_begin, pos); + ++nesting_level; } - ++pos; + else if (pos[0] == '*' && pos[1] == '/') + { + pos += 2; + --nesting_level; + + if (nesting_level == 0) + return Token(TokenType::Comment, token_begin, pos); + } + else + ++pos; } return Token(TokenType::ErrorMultilineCommentIsNotClosed, token_begin, end); } diff --git a/tests/queries/0_stateless/01491_nested_multiline_comments.reference b/tests/queries/0_stateless/01491_nested_multiline_comments.reference new file mode 100644 index 00000000000..e8183f05f5d --- /dev/null +++ b/tests/queries/0_stateless/01491_nested_multiline_comments.reference @@ -0,0 +1,3 @@ +1 +1 +1 diff --git a/tests/queries/0_stateless/01491_nested_multiline_comments.sql b/tests/queries/0_stateless/01491_nested_multiline_comments.sql new file mode 100644 index 00000000000..4c6f7634701 --- /dev/null +++ b/tests/queries/0_stateless/01491_nested_multiline_comments.sql @@ -0,0 +1,3 @@ +SELECT /*/**/*/ 1; +SELECT /*a/*b*/c*/ 1; +SELECT /*ab/*cd*/ef*/ 1; From 453914b6b860dc558719269ab9af35828376fac7 Mon Sep 17 00:00:00 2001 From: alexey-milovidov Date: Wed, 9 Sep 2020 21:02:53 +0300 Subject: [PATCH 090/341] Update ProfileEvents.cpp --- src/Common/ProfileEvents.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/ProfileEvents.cpp b/src/Common/ProfileEvents.cpp index c9ff9642361..486cb7e1a6e 100644 --- a/src/Common/ProfileEvents.cpp +++ b/src/Common/ProfileEvents.cpp @@ -233,7 +233,7 @@ M(S3WriteRequestsErrors, "Number of non-throttling errors in POST, DELETE, PUT and PATCH requests to S3 storage.") \ M(S3WriteRequestsThrottling, "Number of 429 and 503 errors in POST, DELETE, PUT and PATCH requests to S3 storage.") \ M(S3WriteRequestsRedirects, "Number of redirects in POST, DELETE, PUT and PATCH requests to S3 storage.") \ - M(QueryMemoryLimitExceeded, "Number of times of memory limit exceeded for query.") \ + M(QueryMemoryLimitExceeded, "Number of times when memory limit exceeded for query.") \ namespace ProfileEvents From 11ffbda7cc48082ec0c3a44dc34946cf03a9dc4a Mon Sep 17 00:00:00 2001 From: myrrc Date: Wed, 9 Sep 2020 21:17:01 +0300 Subject: [PATCH 091/341] added the debugger info option --- src/Functions/CMakeLists.txt | 14 ++++++++++++-- 1 file changed, 12 insertions(+), 2 deletions(-) diff --git a/src/Functions/CMakeLists.txt b/src/Functions/CMakeLists.txt index 78caabb6941..08eefec84d4 100644 --- a/src/Functions/CMakeLists.txt +++ b/src/Functions/CMakeLists.txt @@ -53,8 +53,18 @@ endif() target_include_directories(clickhouse_functions SYSTEM PRIVATE ${SPARSEHASH_INCLUDE_DIR}) -# Won't generate debug info for files with heavy template instantiation to achieve faster linking and lower size. -target_compile_options(clickhouse_functions PRIVATE "-g0") +option(STRIP_DEBUG_SYMBOLS_FUNCTIONS + "Do not generate debugger info for ClickHouse functions. + Provides faster linking and lower binary size. + Tradeoff is the inability to debug some source files with e.g. gdb + (empty stack frames and no local variables)." 
OFF) + +if (STRIP_DEBUG_SYMBOLS_FUNCTIONS) + message(WARNING "Not generating debugger info for ClickHouse functions") + target_compile_options(clickhouse_functions PRIVATE "-g0") +else() + message(STATUS "Generating debugger info for ClickHouse functions") +endif() if (USE_ICU) target_link_libraries (clickhouse_functions PRIVATE ${ICU_LIBRARIES}) From 2a9ab482792cdadf0d4e2365c3d11494a3e38230 Mon Sep 17 00:00:00 2001 From: Vitaly Baranov Date: Tue, 8 Sep 2020 02:08:17 +0300 Subject: [PATCH 092/341] Use join() instead of detach() for the no_users_thread in StorageLiveView. --- src/Interpreters/Context.cpp | 8 + src/Interpreters/Context.h | 8 +- src/Interpreters/InterpreterDropQuery.h | 1 + .../LiveView/LiveViewBlockInputStream.h | 15 +- .../LiveView/LiveViewEventsBlockInputStream.h | 14 +- src/Storages/LiveView/StorageLiveView.cpp | 144 +---------------- src/Storages/LiveView/StorageLiveView.h | 23 ++- .../LiveView/TemporaryLiveViewCleaner.cpp | 148 ++++++++++++++++++ .../LiveView/TemporaryLiveViewCleaner.h | 51 ++++++ src/Storages/ya.make | 1 + 10 files changed, 233 insertions(+), 180 deletions(-) create mode 100644 src/Storages/LiveView/TemporaryLiveViewCleaner.cpp create mode 100644 src/Storages/LiveView/TemporaryLiveViewCleaner.h diff --git a/src/Interpreters/Context.cpp b/src/Interpreters/Context.cpp index 70cf41a679c..3c4c095cc26 100644 --- a/src/Interpreters/Context.cpp +++ b/src/Interpreters/Context.cpp @@ -23,6 +23,7 @@ #include #include #include +#include #include #include #include @@ -423,6 +424,7 @@ struct ContextShared if (system_logs) system_logs->shutdown(); + TemporaryLiveViewCleaner::shutdown(); DatabaseCatalog::shutdown(); /// Preemptive destruction is important, because these objects may have a refcount to ContextShared (cyclic reference). 
@@ -479,6 +481,12 @@ Context Context::createGlobal(ContextShared * shared) return res; } +void Context::initGlobal() +{ + DatabaseCatalog::init(this); + TemporaryLiveViewCleaner::init(*this); +} + SharedContextHolder Context::createShared() { return SharedContextHolder(std::make_unique()); diff --git a/src/Interpreters/Context.h b/src/Interpreters/Context.h index c8d13baa9ae..743c92d56b5 100644 --- a/src/Interpreters/Context.h +++ b/src/Interpreters/Context.h @@ -445,11 +445,7 @@ public: void makeQueryContext() { query_context = this; } void makeSessionContext() { session_context = this; } - void makeGlobalContext() - { - global_context = this; - DatabaseCatalog::init(this); - } + void makeGlobalContext() { initGlobal(); global_context = this; } const Settings & getSettingsRef() const { return settings; } @@ -622,6 +618,8 @@ public: private: std::unique_lock getLock() const; + void initGlobal(); + /// Compute and set actual user settings, client_info.current_user should be set void calculateAccessRights(); diff --git a/src/Interpreters/InterpreterDropQuery.h b/src/Interpreters/InterpreterDropQuery.h index 80bd6c6531a..b54736b5c21 100644 --- a/src/Interpreters/InterpreterDropQuery.h +++ b/src/Interpreters/InterpreterDropQuery.h @@ -10,6 +10,7 @@ namespace DB { class Context; using DatabaseAndTable = std::pair; +class AccessRightsElements; /** Allow to either drop table with all its data (DROP), * or remove information about table (just forget) from server (DETACH), diff --git a/src/Storages/LiveView/LiveViewBlockInputStream.h b/src/Storages/LiveView/LiveViewBlockInputStream.h index 7cab2cb41ed..737e76754c5 100644 --- a/src/Storages/LiveView/LiveViewBlockInputStream.h +++ b/src/Storages/LiveView/LiveViewBlockInputStream.h @@ -16,27 +16,17 @@ class LiveViewBlockInputStream : public IBlockInputStream using NonBlockingResult = std::pair; public: - ~LiveViewBlockInputStream() override - { - /// Start storage no users thread - /// if we are the last active user - if (!storage->is_dropped && blocks_ptr.use_count() < 3) - storage->startNoUsersThread(temporary_live_view_timeout_sec); - } - LiveViewBlockInputStream(std::shared_ptr storage_, std::shared_ptr blocks_ptr_, std::shared_ptr blocks_metadata_ptr_, std::shared_ptr active_ptr_, const bool has_limit_, const UInt64 limit_, - const UInt64 heartbeat_interval_sec_, - const UInt64 temporary_live_view_timeout_sec_) + const UInt64 heartbeat_interval_sec_) : storage(std::move(storage_)), blocks_ptr(std::move(blocks_ptr_)), blocks_metadata_ptr(std::move(blocks_metadata_ptr_)), active_ptr(std::move(active_ptr_)), has_limit(has_limit_), limit(limit_), - heartbeat_interval_usec(heartbeat_interval_sec_ * 1000000), - temporary_live_view_timeout_sec(temporary_live_view_timeout_sec_) + heartbeat_interval_usec(heartbeat_interval_sec_ * 1000000) { /// grab active pointer active = active_ptr.lock(); @@ -205,7 +195,6 @@ private: Int64 num_updates = -1; bool end_of_blocks = false; UInt64 heartbeat_interval_usec; - UInt64 temporary_live_view_timeout_sec; UInt64 last_event_timestamp_usec = 0; }; diff --git a/src/Storages/LiveView/LiveViewEventsBlockInputStream.h b/src/Storages/LiveView/LiveViewEventsBlockInputStream.h index ac5e7e3d6fd..4060b17c1ed 100644 --- a/src/Storages/LiveView/LiveViewEventsBlockInputStream.h +++ b/src/Storages/LiveView/LiveViewEventsBlockInputStream.h @@ -34,13 +34,6 @@ class LiveViewEventsBlockInputStream : public IBlockInputStream using NonBlockingResult = std::pair; public: - ~LiveViewEventsBlockInputStream() override - { - /// Start 
storage no users thread - /// if we are the last active user - if (!storage->is_dropped && blocks_ptr.use_count() < 3) - storage->startNoUsersThread(temporary_live_view_timeout_sec); - } /// length default -2 because we want LIMIT to specify number of updates so that LIMIT 1 waits for 1 update /// and LIMIT 0 just returns data without waiting for any updates LiveViewEventsBlockInputStream(std::shared_ptr storage_, @@ -48,14 +41,12 @@ public: std::shared_ptr blocks_metadata_ptr_, std::shared_ptr active_ptr_, const bool has_limit_, const UInt64 limit_, - const UInt64 heartbeat_interval_sec_, - const UInt64 temporary_live_view_timeout_sec_) + const UInt64 heartbeat_interval_sec_) : storage(std::move(storage_)), blocks_ptr(std::move(blocks_ptr_)), blocks_metadata_ptr(std::move(blocks_metadata_ptr_)), active_ptr(std::move(active_ptr_)), has_limit(has_limit_), limit(limit_), - heartbeat_interval_usec(heartbeat_interval_sec_ * 1000000), - temporary_live_view_timeout_sec(temporary_live_view_timeout_sec_) + heartbeat_interval_usec(heartbeat_interval_sec_ * 1000000) { /// grab active pointer active = active_ptr.lock(); @@ -236,7 +227,6 @@ private: Int64 num_updates = -1; bool end_of_blocks = false; UInt64 heartbeat_interval_usec; - UInt64 temporary_live_view_timeout_sec; UInt64 last_event_timestamp_usec = 0; Poco::Timestamp timestamp; }; diff --git a/src/Storages/LiveView/StorageLiveView.cpp b/src/Storages/LiveView/StorageLiveView.cpp index 54ac5bcc791..b16c02eec6b 100644 --- a/src/Storages/LiveView/StorageLiveView.cpp +++ b/src/Storages/LiveView/StorageLiveView.cpp @@ -12,10 +12,8 @@ limitations under the License. */ #include #include #include -#include #include #include -#include #include #include #include @@ -31,6 +29,7 @@ limitations under the License. */ #include #include #include +#include #include #include @@ -276,7 +275,7 @@ StorageLiveView::StorageLiveView( if (query.live_view_timeout) { is_temporary = true; - temporary_live_view_timeout = *query.live_view_timeout; + temporary_live_view_timeout = std::chrono::seconds{*query.live_view_timeout}; } blocks_ptr = std::make_shared(); @@ -384,128 +383,21 @@ void StorageLiveView::checkTableCanBeDropped() const } } -void StorageLiveView::noUsersThread(std::shared_ptr storage, const UInt64 & timeout) -{ - bool drop_table = false; - - if (storage->shutdown_called) - return; - - auto table_id = storage->getStorageID(); - { - while (true) - { - std::unique_lock lock(storage->no_users_thread_wakeup_mutex); - if (!storage->no_users_thread_condition.wait_for(lock, std::chrono::seconds(timeout), [&] { return storage->no_users_thread_wakeup; })) - { - storage->no_users_thread_wakeup = false; - if (storage->shutdown_called) - return; - if (storage->hasUsers()) - return; - if (!DatabaseCatalog::instance().getDependencies(table_id).empty()) - continue; - drop_table = true; - } - break; - } - } - - if (drop_table) - { - if (DatabaseCatalog::instance().tryGetTable(table_id, storage->global_context)) - { - try - { - /// We create and execute `drop` query for this table - auto drop_query = std::make_shared(); - drop_query->database = table_id.database_name; - drop_query->table = table_id.table_name; - drop_query->kind = ASTDropQuery::Kind::Drop; - ASTPtr ast_drop_query = drop_query; - InterpreterDropQuery drop_interpreter(ast_drop_query, storage->global_context); - drop_interpreter.execute(); - } - catch (...) 
- { - tryLogCurrentException(__PRETTY_FUNCTION__); - } - } - } -} - -void StorageLiveView::startNoUsersThread(const UInt64 & timeout) -{ - bool expected = false; - if (!start_no_users_thread_called.compare_exchange_strong(expected, true)) - return; - - if (is_temporary) - { - std::lock_guard no_users_thread_lock(no_users_thread_mutex); - - if (shutdown_called) - return; - - if (no_users_thread.joinable()) - { - { - std::lock_guard lock(no_users_thread_wakeup_mutex); - no_users_thread_wakeup = true; - no_users_thread_condition.notify_one(); - } - no_users_thread.join(); - } - { - std::lock_guard lock(no_users_thread_wakeup_mutex); - no_users_thread_wakeup = false; - } - if (!is_dropped) - no_users_thread = std::thread(&StorageLiveView::noUsersThread, - std::static_pointer_cast(shared_from_this()), timeout); - } - - start_no_users_thread_called = false; -} - void StorageLiveView::startup() { - startNoUsersThread(temporary_live_view_timeout); + if (is_temporary) + TemporaryLiveViewCleaner::instance().addView(std::static_pointer_cast(shared_from_this())); } void StorageLiveView::shutdown() { + shutdown_called = true; DatabaseCatalog::instance().removeDependency(select_table_id, getStorageID()); - bool expected = false; - if (!shutdown_called.compare_exchange_strong(expected, true)) - return; - - /// WATCH queries should be stopped after setting shutdown_called to true. - /// Otherwise livelock is possible for LiveView table in Atomic database: - /// WATCH query will wait for table to be dropped and DatabaseCatalog will wait for queries to finish - - { - std::lock_guard no_users_thread_lock(no_users_thread_mutex); - if (no_users_thread.joinable()) - { - { - std::lock_guard lock(no_users_thread_wakeup_mutex); - no_users_thread_wakeup = true; - no_users_thread_condition.notify_one(); - } - } - } } StorageLiveView::~StorageLiveView() { shutdown(); - - { - std::lock_guard lock(no_users_thread_mutex); - if (no_users_thread.joinable()) - no_users_thread.detach(); - } } void StorageLiveView::drop() @@ -572,18 +464,7 @@ BlockInputStreams StorageLiveView::watch( auto reader = std::make_shared( std::static_pointer_cast(shared_from_this()), blocks_ptr, blocks_metadata_ptr, active_ptr, has_limit, limit, - context.getSettingsRef().live_view_heartbeat_interval.totalSeconds(), - temporary_live_view_timeout); - - { - std::lock_guard no_users_thread_lock(no_users_thread_mutex); - if (no_users_thread.joinable()) - { - std::lock_guard lock(no_users_thread_wakeup_mutex); - no_users_thread_wakeup = true; - no_users_thread_condition.notify_one(); - } - } + context.getSettingsRef().live_view_heartbeat_interval.totalSeconds()); { std::lock_guard lock(mutex); @@ -603,18 +484,7 @@ BlockInputStreams StorageLiveView::watch( auto reader = std::make_shared( std::static_pointer_cast(shared_from_this()), blocks_ptr, blocks_metadata_ptr, active_ptr, has_limit, limit, - context.getSettingsRef().live_view_heartbeat_interval.totalSeconds(), - temporary_live_view_timeout); - - { - std::lock_guard no_users_thread_lock(no_users_thread_mutex); - if (no_users_thread.joinable()) - { - std::lock_guard lock(no_users_thread_wakeup_mutex); - no_users_thread_wakeup = true; - no_users_thread_condition.notify_one(); - } - } + context.getSettingsRef().live_view_heartbeat_interval.totalSeconds()); { std::lock_guard lock(mutex); diff --git a/src/Storages/LiveView/StorageLiveView.h b/src/Storages/LiveView/StorageLiveView.h index 43afd169a92..32e18ef6092 100644 --- a/src/Storages/LiveView/StorageLiveView.h +++ 
b/src/Storages/LiveView/StorageLiveView.h @@ -38,6 +38,10 @@ using ASTPtr = std::shared_ptr; using BlocksMetadataPtr = std::shared_ptr; using MergeableBlocksPtr = std::shared_ptr; +class Pipe; +using Pipes = std::vector; + + class StorageLiveView final : public ext::shared_ptr_helper, public IStorage { friend struct ext::shared_ptr_helper; @@ -70,7 +74,9 @@ public: NamesAndTypesList getVirtuals() const override; - bool isTemporary() { return is_temporary; } + bool isTemporary() const { return is_temporary; } + std::chrono::seconds getTimeout() const { return temporary_live_view_timeout; } + /// Check if we have any readers /// must be called with mutex locked @@ -85,11 +91,7 @@ public: { return active_ptr.use_count() > 1; } - /// No users thread mutex, predicate and wake up condition - void startNoUsersThread(const UInt64 & timeout); - std::mutex no_users_thread_wakeup_mutex; - bool no_users_thread_wakeup = false; - std::condition_variable no_users_thread_condition; + /// Get blocks hash /// must be called with mutex locked String getBlocksHashKey() @@ -175,6 +177,8 @@ private: std::unique_ptr live_view_context; bool is_temporary = false; + std::chrono::seconds temporary_live_view_timeout; + /// Mutex to protect access to sample block and inner_blocks_query mutable std::mutex sample_block_lock; mutable Block sample_block; @@ -193,14 +197,7 @@ private: std::shared_ptr blocks_metadata_ptr; MergeableBlocksPtr mergeable_blocks; - /// Background thread for temporary tables - /// which drops this table if there are no users - static void noUsersThread(std::shared_ptr storage, const UInt64 & timeout); - std::mutex no_users_thread_mutex; - std::thread no_users_thread; std::atomic shutdown_called = false; - std::atomic start_no_users_thread_called = false; - UInt64 temporary_live_view_timeout; StorageLiveView( const StorageID & table_id_, diff --git a/src/Storages/LiveView/TemporaryLiveViewCleaner.cpp b/src/Storages/LiveView/TemporaryLiveViewCleaner.cpp new file mode 100644 index 00000000000..0f7c1039d72 --- /dev/null +++ b/src/Storages/LiveView/TemporaryLiveViewCleaner.cpp @@ -0,0 +1,148 @@ +#include +#include +#include +#include +#include + + +namespace DB +{ +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; +} + + +namespace +{ + void executeDropQuery(const StorageID & storage_id, Context & context) + { + if (!DatabaseCatalog::instance().isTableExist(storage_id, context)) + return; + try + { + /// We create and execute `drop` query for this table + auto drop_query = std::make_shared(); + drop_query->database = storage_id.database_name; + drop_query->table = storage_id.table_name; + drop_query->kind = ASTDropQuery::Kind::Drop; + ASTPtr ast_drop_query = drop_query; + InterpreterDropQuery drop_interpreter(ast_drop_query, context); + drop_interpreter.execute(); + } + catch (...) 
+ { + tryLogCurrentException(__PRETTY_FUNCTION__); + } + } +} + + +std::unique_ptr TemporaryLiveViewCleaner::the_instance; + + +void TemporaryLiveViewCleaner::init(Context & global_context_) +{ + if (the_instance) + throw Exception("TemporaryLiveViewCleaner already initialized", ErrorCodes::LOGICAL_ERROR); + the_instance.reset(new TemporaryLiveViewCleaner(global_context_)); +} + + +void TemporaryLiveViewCleaner::shutdown() +{ + the_instance.reset(); +} + + +TemporaryLiveViewCleaner::TemporaryLiveViewCleaner(Context & global_context_) + : global_context(global_context_) +{ +} + + +TemporaryLiveViewCleaner::~TemporaryLiveViewCleaner() +{ + stopBackgroundThread(); +} + + +void TemporaryLiveViewCleaner::addView(const std::shared_ptr & view) +{ + if (!view->isTemporary()) + return; + + auto current_time = std::chrono::system_clock::now(); + auto time_of_next_check = current_time + view->getTimeout(); + + std::lock_guard lock{mutex}; + + /// Keep the vector `views` sorted by time of next check. + StorageAndTimeOfCheck storage_and_time_of_check{view, time_of_next_check}; + views.insert(std::upper_bound(views.begin(), views.end(), storage_and_time_of_check), storage_and_time_of_check); + + if (!background_thread.joinable()) + background_thread = ThreadFromGlobalPool{&TemporaryLiveViewCleaner::backgroundThreadFunc, this}; + + background_thread_wake_up.notify_one(); +} + + +void TemporaryLiveViewCleaner::backgroundThreadFunc() +{ + std::unique_lock lock{mutex}; + while (!background_thread_should_exit && !views.empty()) + { + background_thread_wake_up.wait_until(lock, views.front().time_of_check); + if (background_thread_should_exit) + return; + + auto current_time = std::chrono::system_clock::now(); + std::vector storages_to_drop; + + auto it = views.begin(); + while (it != views.end()) + { + std::shared_ptr storage = it->storage.lock(); + auto & time_of_check = it->time_of_check; + if (!storage) + { + /// Storage has been already removed. + it = views.erase(it); + continue; + } + + ++it; + + if (current_time < time_of_check) + break; /// It's not the time to check it yet. + + time_of_check = current_time + storage->getTimeout(); + + auto storage_id = storage->getStorageID(); + if (storage->hasUsers() || !DatabaseCatalog::instance().getDependencies(storage_id).empty()) + continue; + + storages_to_drop.emplace_back(storage_id); + } + + lock.unlock(); + for (const auto & storage_id : storages_to_drop) + executeDropQuery(storage_id, global_context); + lock.lock(); + } +} + + +void TemporaryLiveViewCleaner::stopBackgroundThread() +{ + std::lock_guard lock{mutex}; + if (background_thread.joinable()) + { + background_thread_should_exit = true; + background_thread_wake_up.notify_one(); + background_thread.join(); + } +} + +} diff --git a/src/Storages/LiveView/TemporaryLiveViewCleaner.h b/src/Storages/LiveView/TemporaryLiveViewCleaner.h new file mode 100644 index 00000000000..57c12bd1c07 --- /dev/null +++ b/src/Storages/LiveView/TemporaryLiveViewCleaner.h @@ -0,0 +1,51 @@ +#pragma once + +#include +#include + + +namespace DB +{ +class StorageLiveView; +struct StorageID; + +/// This class removes temporary live views in the background thread when it's possible. +/// There should only a single instance of this class. +class TemporaryLiveViewCleaner +{ +public: + static TemporaryLiveViewCleaner & instance() { return *the_instance; } + + /// Drops a specified live view after a while if it's temporary. + void addView(const std::shared_ptr & view); + + /// Should be called once. 
+ static void init(Context & global_context_); + static void shutdown(); + +private: + friend std::unique_ptr::deleter_type; + + TemporaryLiveViewCleaner(Context & global_context_); + ~TemporaryLiveViewCleaner(); + + void backgroundThreadFunc(); + void stopBackgroundThread(); + + struct StorageAndTimeOfCheck + { + std::weak_ptr storage; + std::chrono::system_clock::time_point time_of_check; + bool operator <(const StorageAndTimeOfCheck & other) const { return time_of_check < other.time_of_check; } + }; + + static std::unique_ptr the_instance; + Context & global_context; + std::mutex mutex; + std::vector views; + ThreadFromGlobalPool background_thread; + std::atomic background_thread_should_exit = false; + std::condition_variable background_thread_wake_up; +}; + +} diff --git a/src/Storages/ya.make b/src/Storages/ya.make index 1ddb8c77072..fed961ed2bb 100644 --- a/src/Storages/ya.make +++ b/src/Storages/ya.make @@ -20,6 +20,7 @@ SRCS( IStorage.cpp KeyDescription.cpp LiveView/StorageLiveView.cpp + LiveView/TemporaryLiveViewCleaner.cpp MergeTree/ActiveDataPartSet.cpp MergeTree/AllMergeSelector.cpp MergeTree/BackgroundProcessingPool.cpp From b8a2c1d2a29517c2bd0e8f791ce31c474f30f7d5 Mon Sep 17 00:00:00 2001 From: alesapin Date: Wed, 9 Sep 2020 22:45:37 +0300 Subject: [PATCH 093/341] Push pragma only for new gcc --- src/Storages/MergeTree/MergeTreePartition.cpp | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreePartition.cpp b/src/Storages/MergeTree/MergeTreePartition.cpp index 8ef3e458871..2802b842f54 100644 --- a/src/Storages/MergeTree/MergeTreePartition.cpp +++ b/src/Storages/MergeTree/MergeTreePartition.cpp @@ -29,8 +29,10 @@ String MergeTreePartition::getID(const MergeTreeData & storage) const return getID(storage.getInMemoryMetadataPtr()->getPartitionKey().sample_block); } -#pragma GCC diagnostic push -#pragma GCC diagnostic ignored "-Wstringop-overflow" +#if defined (__GNUC__) && __GNUC__ >= 10 + #pragma GCC diagnostic push + #pragma GCC diagnostic ignored "-Wstringop-overflow" +#endif /// NOTE: This ID is used to create part names which are then persisted in ZK and as directory names on the file system. /// So if you want to change this method, be sure to guarantee compatibility with existing table data. 
@@ -90,7 +92,9 @@ String MergeTreePartition::getID(const Block & partition_key_sample) const return result; } -#pragma GCC diagnostic pop +#if defined (__GNUC__) && __GNUC__ >= 10 + #pragma GCC diagnostic pop +#endif void MergeTreePartition::serializeText(const MergeTreeData & storage, WriteBuffer & out, const FormatSettings & format_settings) const { From 7080d56470a9bfed57dde63ef2e40c9832599c72 Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Wed, 9 Sep 2020 22:59:34 +0300 Subject: [PATCH 094/341] fix missed database name when altering mv --- src/Storages/SelectQueryDescription.cpp | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/src/Storages/SelectQueryDescription.cpp b/src/Storages/SelectQueryDescription.cpp index bb8295df6f3..0935a5be5ca 100644 --- a/src/Storages/SelectQueryDescription.cpp +++ b/src/Storages/SelectQueryDescription.cpp @@ -105,14 +105,14 @@ SelectQueryDescription SelectQueryDescription::getSelectQueryFromASTForMatView(c if (new_select.list_of_selects->children.size() != 1) throw Exception("UNION is not supported for MATERIALIZED VIEW", ErrorCodes::QUERY_IS_NOT_SUPPORTED_IN_MATERIALIZED_VIEW); - SelectQueryDescription result; - - result.inner_query = new_select.list_of_selects->children.at(0)->clone(); - - auto & select_query = result.inner_query->as(); + auto & new_inner_query = new_select.list_of_selects->children.at(0); + auto & select_query = new_inner_query->as(); checkAllowedQueries(select_query); + + SelectQueryDescription result; result.select_table_id = extractDependentTableFromSelectQuery(select_query, context); - result.select_query = select->clone(); + result.select_query = new_select.clone(); + result.inner_query = new_inner_query->clone(); return result; } From 27258c8e70213cf57e1bbf36176cda961d56e12f Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Wed, 9 Sep 2020 23:47:42 +0300 Subject: [PATCH 095/341] utils/list-licenses/list-licenses.sh: ignore more files - *.rtf They can have NULL byte, and StorageSystemLicenses.sh will warn: ./StorageSystemLicenses.sh: line 11: warning: command substitution: ignored null byte in input Found with: find contrib/ -type f -and '(' -iname 'LICENSE*' -or -iname 'COPYING*' -or -iname 'COPYRIGHT*' ')' -and -not -iname '*.html' | xargs grep -Pa '\x00' - *.h - *.cpp - *.htm And after verified with: $ find contrib/ -type f -and '(' -iname 'LICENSE*' -or -iname 'COPYING*' -or -iname 'COPYRIGHT*' ')' -and -not '(' -iname '*.html' -or -iname '*.htm' -or -iname '*.rtf' -or -name '*.cpp' -or -name '*.h' -or -iname '*.json' ')' | xargs file -b | sort -u ASCII text ASCII text, with CR line terminators ASCII text, with very long lines empty UTF-8 Unicode text --- utils/list-licenses/list-licenses.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/utils/list-licenses/list-licenses.sh b/utils/list-licenses/list-licenses.sh index 987179e26a8..8eee3f97253 100755 --- a/utils/list-licenses/list-licenses.sh +++ b/utils/list-licenses/list-licenses.sh @@ -7,7 +7,7 @@ ls -1 -d ${LIBS_PATH}/*/ | grep -F -v -- '-cmake' | while read LIB; do LIB_NAME=$(basename $LIB) LIB_LICENSE=$( - LC_ALL=C find "$LIB" -type f -and '(' -iname 'LICENSE*' -or -iname 'COPYING*' -or -iname 'COPYRIGHT*' ')' -and -not -iname '*.html' -printf "%d\t%p\n" | + LC_ALL=C find "$LIB" -type f -and '(' -iname 'LICENSE*' -or -iname 'COPYING*' -or -iname 'COPYRIGHT*' ')' -and -not '(' -iname '*.html' -or -iname '*.htm' -or -iname '*.rtf' -or -name '*.cpp' -or -name '*.h' -or -iname '*.json' ')' -printf "%d\t%p\n" | awk ' 
BEGIN { IGNORECASE=1; min_depth = 0 } /LICENSE/ { if (!min_depth || $1 <= min_depth) { min_depth = $1; license = $2 } } From 0f4fdcbf389909ed2e642263b0d6a65a3580d8e0 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Thu, 10 Sep 2020 02:05:41 +0300 Subject: [PATCH 096/341] Pass -fsanitize-blacklist for TSAN only under clang (gcc does not support this) And no such check for -fsnaitize=memory, since gcc does not support it anyway. --- cmake/sanitize.cmake | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/cmake/sanitize.cmake b/cmake/sanitize.cmake index 32443ed78c3..7c7e9c388a0 100644 --- a/cmake/sanitize.cmake +++ b/cmake/sanitize.cmake @@ -36,7 +36,15 @@ if (SANITIZE) endif () elseif (SANITIZE STREQUAL "thread") - set (TSAN_FLAGS "-fsanitize=thread -fsanitize-blacklist=${CMAKE_SOURCE_DIR}/tests/tsan_suppressions.txt") + set (TSAN_FLAGS "-fsanitize=thread") + if (COMPILER_CLANG) + set (TSAN_FLAGS "${TSAN_FLAGS} -fsanitize-blacklist=${CMAKE_SOURCE_DIR}/tests/tsan_suppressions.txt") + else() + message (WARNING "TSAN suppressions was not passed to the compiler (since the compiler is not clang)") + message (WARNING "Use the following command to pass them manually:") + message (WARNING " export TSAN_OPTIONS=\"$TSAN_OPTIONS suppressions=${CMAKE_SOURCE_DIR}/tests/tsan_suppressions.txt\"") + endif() + set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${SAN_FLAGS} ${TSAN_FLAGS}") set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${SAN_FLAGS} ${TSAN_FLAGS}") From 0a3f7d0fccc8b960d59b415b02313673d1bdc698 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Sat, 5 Sep 2020 19:49:47 -0700 Subject: [PATCH 097/341] AsynchronousMetricsLog - add improved tests This adds integration tests to test the asynchronous_metric_log table for event_time_microseconds field. Asynchronous metrics are updated once every 60s, so this setting needs to be overridden for having those metrics available in time so that the tests can run. So the `asynchronous_metric_update_period_s` setting is being overriden to be 2s. 
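For reference, a minimal sketch of the override file this patch adds
(tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml).
The exact tag name and the <yandex> root element are assumptions inferred from
the file name and the usual layout of these test config overrides; only the
value (2 seconds) is stated by this patch:

    <yandex>
        <asynchronous_metrics_update_period_s>2</asynchronous_metrics_update_period_s>
    </yandex>

The integration test mounts this file through main_configs so that asynchronous
metrics are refreshed every 2 seconds instead of the default 60 seconds, which
is what makes them queryable within the test's runtime.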
--- .../__init__.py | 0 .../asynchronous_metrics_update_period_s.xml | 3 ++ .../test.py | 32 +++++++++++++++++++ .../01473_event_time_microseconds.reference | 4 +-- .../01473_event_time_microseconds.sql | 12 ++++--- 5 files changed, 43 insertions(+), 8 deletions(-) create mode 100644 tests/integration/test_asynchronous_metric_log_table/__init__.py create mode 100644 tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml create mode 100644 tests/integration/test_asynchronous_metric_log_table/test.py diff --git a/tests/integration/test_asynchronous_metric_log_table/__init__.py b/tests/integration/test_asynchronous_metric_log_table/__init__.py new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml b/tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml new file mode 100644 index 00000000000..840c19f03a6 --- /dev/null +++ b/tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml @@ -0,0 +1,3 @@ + + 2 + diff --git a/tests/integration/test_asynchronous_metric_log_table/test.py b/tests/integration/test_asynchronous_metric_log_table/test.py new file mode 100644 index 00000000000..10face9abc6 --- /dev/null +++ b/tests/integration/test_asynchronous_metric_log_table/test.py @@ -0,0 +1,32 @@ +import time + +from helpers.cluster import ClickHouseCluster + +# Tests that the event_time_microseconds field in system.asynchronous_metric_log table gets populated. +# asynchronous metrics are updated once every 60s by default. To make the test run faster, the setting +# asynchronous_metric_update_period_s is being set to 2s so that the metrics are populated faster and +# are available for querying during the test. 
+def test_asynchronous_metric_log(): + cluster = ClickHouseCluster(__file__) + node1 = cluster.add_instance('node1', with_zookeeper=True, main_configs=['configs/asynchronous_metrics_update_period_s.xml']) + try: + cluster.start() + node1.query("SET log_queries = 1;") + node1.query("CREATE DATABASE replica;") + query_create = '''CREATE TABLE replica.test + ( + id Int64, + event_time DateTime + ) + Engine=MergeTree() + PARTITION BY toYYYYMMDD(event_time) + ORDER BY id;''' + time.sleep(2) + node1.query(query_create) + node1.query('''INSERT INTO replica.test VALUES (1, now())''') + node1.query("SYSTEM FLUSH LOGS;") + node1.query("SELECT * FROM system.asynchronous_metrics LIMIT 10") + assert "1\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') + assert "ok\n" in node1.query("SELECT If((select count(event_time_microseconds) from system.asynchronous_metric_log) > 0, 'ok', 'fail');") + finally: + cluster.shutdown() diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.reference b/tests/queries/0_stateless/01473_event_time_microseconds.reference index cac87f32a29..8aa31f9ab6a 100644 --- a/tests/queries/0_stateless/01473_event_time_microseconds.reference +++ b/tests/queries/0_stateless/01473_event_time_microseconds.reference @@ -1,4 +1,2 @@ -01473_asynchronous_metric_log_event_start_time_milliseconds_test -ok -01473_metric_log_event_start_time_milliseconds_test +01473_metric_log_table_event_start_time_microseconds_test ok diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.sql b/tests/queries/0_stateless/01473_event_time_microseconds.sql index 6a13d6e1543..9bafd3bdbda 100644 --- a/tests/queries/0_stateless/01473_event_time_microseconds.sql +++ b/tests/queries/0_stateless/01473_event_time_microseconds.sql @@ -1,9 +1,11 @@ +-- This file contains tests for the event_time_microseconds field for various tables. +-- Note: Only event_time_microseconds for asynchronous_metric_log table is tested via +-- an integration test as those metrics take 60s by default to be updated. +-- Refer: tests/integration/test_asynchronous_metric_log_table. 
+ set log_queries = 1; -select '01473_asynchronous_metric_log_event_start_time_milliseconds_test'; -system flush logs; -SELECT If((select count(event_time_microseconds) from system.asynchronous_metric_log) > 0, 'ok', 'fail'); -- success - -select '01473_metric_log_event_start_time_milliseconds_test'; +select '01473_metric_log_table_event_start_time_microseconds_test'; system flush logs; +SELECT sleep(3) Format Null; SELECT If((select count(event_time_microseconds) from system.metric_log) > 0, 'ok', 'fail'); -- success From 2ad63d2b4de47ca598712f9404a26ea53ba35e70 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Wed, 9 Sep 2020 17:56:21 -0700 Subject: [PATCH 098/341] AsynchronousMetricLog - refactor integration test --- .../test.py | 23 +++++++++++++++---- 1 file changed, 19 insertions(+), 4 deletions(-) diff --git a/tests/integration/test_asynchronous_metric_log_table/test.py b/tests/integration/test_asynchronous_metric_log_table/test.py index 10face9abc6..9910a188e2c 100644 --- a/tests/integration/test_asynchronous_metric_log_table/test.py +++ b/tests/integration/test_asynchronous_metric_log_table/test.py @@ -1,14 +1,28 @@ import time +import pytest from helpers.cluster import ClickHouseCluster +cluster = ClickHouseCluster(__file__) +node1 = cluster.add_instance('node1', with_zookeeper=True, + main_configs=['configs/asynchronous_metrics_update_period_s.xml']) + + +@pytest.fixture(scope="module") +def started_cluster(): + try: + cluster.start() + yield cluster + + finally: + cluster.shutdown() + + # Tests that the event_time_microseconds field in system.asynchronous_metric_log table gets populated. # asynchronous metrics are updated once every 60s by default. To make the test run faster, the setting # asynchronous_metric_update_period_s is being set to 2s so that the metrics are populated faster and # are available for querying during the test. 
-def test_asynchronous_metric_log(): - cluster = ClickHouseCluster(__file__) - node1 = cluster.add_instance('node1', with_zookeeper=True, main_configs=['configs/asynchronous_metrics_update_period_s.xml']) +def test_event_time_microseconds_field(started_cluster): try: cluster.start() node1.query("SET log_queries = 1;") @@ -27,6 +41,7 @@ def test_asynchronous_metric_log(): node1.query("SYSTEM FLUSH LOGS;") node1.query("SELECT * FROM system.asynchronous_metrics LIMIT 10") assert "1\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') - assert "ok\n" in node1.query("SELECT If((select count(event_time_microseconds) from system.asynchronous_metric_log) > 0, 'ok', 'fail');") + assert "ok\n" in node1.query( + "SELECT If((select count(event_time_microseconds) from system.asynchronous_metric_log) > 0, 'ok', 'fail');") finally: cluster.shutdown() From 31b0bd481c687160e2217a1443b244fad2733a04 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Thu, 10 Sep 2020 00:17:20 -0700 Subject: [PATCH 099/341] Integration tests - more accurate tests --- .../test.py | 20 +++++++++++++++---- .../01473_event_time_microseconds.sql | 16 ++++++++++++++- 2 files changed, 31 insertions(+), 5 deletions(-) diff --git a/tests/integration/test_asynchronous_metric_log_table/test.py b/tests/integration/test_asynchronous_metric_log_table/test.py index 9910a188e2c..0eb72c20376 100644 --- a/tests/integration/test_asynchronous_metric_log_table/test.py +++ b/tests/integration/test_asynchronous_metric_log_table/test.py @@ -39,9 +39,21 @@ def test_event_time_microseconds_field(started_cluster): node1.query(query_create) node1.query('''INSERT INTO replica.test VALUES (1, now())''') node1.query("SYSTEM FLUSH LOGS;") - node1.query("SELECT * FROM system.asynchronous_metrics LIMIT 10") - assert "1\n" in node1.query('''SELECT count() from replica.test FORMAT TSV''') - assert "ok\n" in node1.query( - "SELECT If((select count(event_time_microseconds) from system.asynchronous_metric_log) > 0, 'ok', 'fail');") + #query assumes that the event_time field is accurate + equals_query = '''WITH ( + ( + SELECT event_time_microseconds + FROM system.asynchronous_metric_log + ORDER BY event_time DESC + LIMIT 1 + ) AS time_with_microseconds, + ( + SELECT event_time + FROM system.asynchronous_metric_log + ORDER BY event_time DESC + LIMIT 1 + ) AS time) + SELECT if(dateDiff('second', toDateTime(time_with_microseconds), toDateTime(time)) = 0, 'ok', 'fail')''' + assert "ok\n" in node1.query(equals_query) finally: cluster.shutdown() diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.sql b/tests/queries/0_stateless/01473_event_time_microseconds.sql index 9bafd3bdbda..dd79a735d8f 100644 --- a/tests/queries/0_stateless/01473_event_time_microseconds.sql +++ b/tests/queries/0_stateless/01473_event_time_microseconds.sql @@ -8,4 +8,18 @@ set log_queries = 1; select '01473_metric_log_table_event_start_time_microseconds_test'; system flush logs; SELECT sleep(3) Format Null; -SELECT If((select count(event_time_microseconds) from system.metric_log) > 0, 'ok', 'fail'); -- success +-- query assumes that the event_time field is accurate. 
+WITH ( + ( + SELECT event_time_microseconds + FROM system.metric_log + ORDER BY event_time DESC + LIMIT 1 + ) AS time_with_microseconds, + ( + SELECT event_time + FROM system.metric_log + ORDER BY event_time DESC + LIMIT 1 + ) AS time) +SELECT if(dateDiff('second', toDateTime(time_with_microseconds), toDateTime(time)) = 0, 'ok', 'fail') From 7fb45461d174c3ae122c9d11ba5a4414fe0d3fd6 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Thu, 10 Sep 2020 10:36:29 +0300 Subject: [PATCH 100/341] Try fix totals port for IAccumulatingTransform. --- src/Processors/IAccumulatingTransform.cpp | 16 +++++++--------- 1 file changed, 7 insertions(+), 9 deletions(-) diff --git a/src/Processors/IAccumulatingTransform.cpp b/src/Processors/IAccumulatingTransform.cpp index 2905d185df2..64bdbe2410f 100644 --- a/src/Processors/IAccumulatingTransform.cpp +++ b/src/Processors/IAccumulatingTransform.cpp @@ -49,13 +49,15 @@ IAccumulatingTransform::Status IAccumulatingTransform::prepare() return Status::Finished; } - /// Close input if flag was set manually. + if (input.isFinished()) + finished_input = true; + if (finished_input) + { + /// Close input if flag was set manually. input.close(); - /// Read from totals port if has it. - if (input.isFinished()) - { + /// Read from totals port if has it. if (inputs.size() > 1) { auto & totals_input = inputs.back(); @@ -69,12 +71,8 @@ IAccumulatingTransform::Status IAccumulatingTransform::prepare() totals_input.close(); } } - } - /// Generate output block. - if (input.isFinished()) - { - finished_input = true; + /// Generate output block. return Status::Ready; } From a64473313971bbd3d461d5c7b68165b39d4515e0 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 10 Sep 2020 12:05:57 +0300 Subject: [PATCH 101/341] Attempt to make performance test more reliable --- programs/server/Server.cpp | 8 +- src/Common/remapExecutable.cpp | 213 +++++++++++++++++++++++++++++++++ src/Common/remapExecutable.h | 7 ++ 3 files changed, 227 insertions(+), 1 deletion(-) create mode 100644 src/Common/remapExecutable.cpp create mode 100644 src/Common/remapExecutable.h diff --git a/programs/server/Server.cpp b/programs/server/Server.cpp index f24ba444203..8149623ffce 100644 --- a/programs/server/Server.cpp +++ b/programs/server/Server.cpp @@ -32,6 +32,7 @@ #include #include #include +#include #include #include #include @@ -307,6 +308,11 @@ int Server::main(const std::vector & /*args*/) { if (config().getBool("mlock_executable", false)) { + LOG_DEBUG(log, "Will remap executable in memory."); + remapExecutable(); + LOG_DEBUG(log, "The code in memory has been successfully remapped."); + +/* if (hasLinuxCapability(CAP_IPC_LOCK)) { LOG_TRACE(log, "Will mlockall to prevent executable memory from being paged out. It may take a few seconds."); @@ -321,7 +327,7 @@ int Server::main(const std::vector & /*args*/) " It could happen due to incorrect ClickHouse package installation." " You could resolve the problem manually with 'sudo setcap cap_ipc_lock=+ep {}'." 
" Note that it will not work on 'nosuid' mounted filesystems.", executable_path); - } + }*/ } } #endif diff --git a/src/Common/remapExecutable.cpp b/src/Common/remapExecutable.cpp new file mode 100644 index 00000000000..f7f353a83c6 --- /dev/null +++ b/src/Common/remapExecutable.cpp @@ -0,0 +1,213 @@ +#if defined(__linux__) && defined(__amd64__) && defined(__SSE2__) + +#include +#include +#include + +#include + +#include + +#include +#include +#include +#include +#include + +#include "remapExecutable.h" + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; + extern const int CANNOT_ALLOCATE_MEMORY; +} + + +namespace +{ + +uintptr_t readAddressHex(DB::ReadBuffer & in) +{ + uintptr_t res = 0; + while (!in.eof()) + { + if (isHexDigit(*in.position())) + { + res *= 16; + res += unhex(*in.position()); + ++in.position(); + } + else + break; + } + return res; +} + + +/** Find the address and size of the mapped memory region pointed by ptr. + */ +std::pair getMappedArea(void * ptr) +{ + using namespace DB; + + uintptr_t uintptr = reinterpret_cast(ptr); + ReadBufferFromFile in("/proc/self/maps"); + + while (!in.eof()) + { + uintptr_t begin = readAddressHex(in); + assertChar('-', in); + uintptr_t end = readAddressHex(in); + skipToNextLineOrEOF(in); + + if (begin <= uintptr && uintptr < end) + return {reinterpret_cast(begin), end - begin}; + } + + throw Exception("Cannot find mapped area for pointer", ErrorCodes::LOGICAL_ERROR); +} + + +__attribute__((__noinline__)) int64_t our_syscall(...) +{ + __asm__ __volatile__ (R"( + movq %%rdi,%%rax; + movq %%rsi,%%rdi; + movq %%rdx,%%rsi; + movq %%rcx,%%rdx; + movq %%r8,%%r10; + movq %%r9,%%r8; + movq 8(%%rsp),%%r9; + syscall; + ret + )" : : : "memory"); + return 0; +} + + +__attribute__((__always_inline__)) void our_memcpy(char * __restrict dst, const char * __restrict src, ssize_t n) +{ + while (n > 0) + { + _mm_storeu_si128(reinterpret_cast<__m128i *>(dst), + _mm_loadu_si128(reinterpret_cast(src))); + + dst += 16; + src += 16; + n -= 16; + } +} + + +__attribute__((__noinline__)) void remapToHugeStep3(void * scratch, size_t size, size_t offset) +{ + /// The function should not use the stack, otherwise various optimizations, including "omit-frame-pointer" may break the code. + + /// Unmap the scratch area. + our_syscall(SYS_munmap, scratch, size); + + /** The return address of this function is pointing to scratch area (because it was called from there). + * But the scratch area no longer exists. We should correct the return address by subtracting the offset. + */ + __asm__ __volatile__("subq %0, 8(%%rsp)" : : "r"(offset) : "memory"); +} + + +__attribute__((__noinline__)) void remapToHugeStep2(void * begin, size_t size, void * scratch) +{ + /** Unmap old memory region with the code of our program. + * Our instruction pointer is located inside scratch area and this function can execute after old code is unmapped. + * But it cannot call any other functions because they are not available at usual addresses + * - that's why we have to use "our_syscall" and "our_memcpy" functions. + * (Relative addressing may continue to work but we should not assume that). + */ + + int64_t offset = reinterpret_cast(scratch) - reinterpret_cast(begin); + int64_t (*syscall_func)(...) 
= reinterpret_cast(reinterpret_cast(our_syscall) + offset); + + //char dot = '.'; + //syscall_func(SYS_write, 2, &dot, 1); + + int64_t munmap_res = syscall_func(SYS_munmap, begin, size); + if (munmap_res != 0) + return; + + //syscall_func(SYS_write, 2, &dot, 1); + + /// Map new anonymous memory region in place of old region with code. + + int64_t mmap_res = syscall_func(SYS_mmap, begin, size, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS | MAP_FIXED, -1, 0); + if (-1 == mmap_res) + syscall_func(SYS_exit, 1); + //syscall_func(SYS_write, 2, &dot, 1); + + /// As the memory region is anonymous, we can do madvise with MADV_HUGEPAGE. + + syscall_func(SYS_madvise, begin, size, MADV_HUGEPAGE); + //syscall_func(SYS_write, 2, &dot, 1); + + /// Copy the code from scratch area to the old memory location. + + our_memcpy(reinterpret_cast(begin), reinterpret_cast(scratch), size); + //syscall_func(SYS_write, 2, &dot, 1); + + /// Make the memory area with the code executable and non-writable. + + syscall_func(SYS_mprotect, begin, size, PROT_READ | PROT_EXEC); + //syscall_func(SYS_write, 2, &dot, 1); + + /** Step 3 function should unmap the scratch area. + * The currently executed code is located in the scratch area and cannot be removed here. + * We have to call another function and use its address from the original location (not in scratch area). + * To do it, we obtain it's pointer and call by pointer. + */ + + void(* volatile step3)(void*, size_t, size_t) = remapToHugeStep3; + step3(scratch, size, offset); +} + + +__attribute__((__noinline__)) void remapToHugeStep1(void * begin, size_t size) +{ + /// Allocate scratch area and copy the code there. + + void * scratch = mmap(nullptr, size, PROT_READ | PROT_WRITE | PROT_EXEC, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); + if (MAP_FAILED == scratch) + throwFromErrno(fmt::format("Cannot mmap {} bytes", size), ErrorCodes::CANNOT_ALLOCATE_MEMORY); + + memcpy(scratch, begin, size); + + /// Offset to the scratch area from previous location. + + int64_t offset = reinterpret_cast(scratch) - reinterpret_cast(begin); + + /// Jump to the next function inside the scratch area. + + reinterpret_cast(reinterpret_cast(remapToHugeStep2) + offset)(begin, size, scratch); +} + +} + + +void remapExecutable() +{ + auto [begin, size] = getMappedArea(reinterpret_cast(remapExecutable)); + remapToHugeStep1(begin, size); +} + +} + +#else + +namespace DB +{ + +void remapExecutable() {} + +} + +#endif diff --git a/src/Common/remapExecutable.h b/src/Common/remapExecutable.h new file mode 100644 index 00000000000..7acb61f13bd --- /dev/null +++ b/src/Common/remapExecutable.h @@ -0,0 +1,7 @@ +namespace DB +{ + +/// This function tries to reallocate the code of the running program in a more efficient way. +void remapExecutable(); + +} From 532d121100fc696fa2edb2d3dff863907850c218 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 10 Sep 2020 12:14:31 +0300 Subject: [PATCH 102/341] Fix typo --- src/Common/remapExecutable.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/remapExecutable.cpp b/src/Common/remapExecutable.cpp index f7f353a83c6..ec8b1703b0a 100644 --- a/src/Common/remapExecutable.cpp +++ b/src/Common/remapExecutable.cpp @@ -163,7 +163,7 @@ __attribute__((__noinline__)) void remapToHugeStep2(void * begin, size_t size, v /** Step 3 function should unmap the scratch area. * The currently executed code is located in the scratch area and cannot be removed here. 
* We have to call another function and use its address from the original location (not in scratch area). - * To do it, we obtain it's pointer and call by pointer. + * To do it, we obtain its pointer and call by pointer. */ void(* volatile step3)(void*, size_t, size_t) = remapToHugeStep3; From 20b3823770f60feefcd73306141bc25875d87f9a Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Thu, 10 Sep 2020 13:21:13 +0300 Subject: [PATCH 103/341] do not remove directory on attach --- src/Storages/StorageReplicatedMergeTree.cpp | 10 +++++++--- .../test_cleanup_dir_after_bad_zk_conn/test.py | 13 ++++++++++++- 2 files changed, 19 insertions(+), 4 deletions(-) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index 00dcc7aeb08..908112c17ff 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -234,10 +234,11 @@ StorageReplicatedMergeTree::StorageReplicatedMergeTree( { current_zookeeper = global_context.getZooKeeper(); } - catch (Poco::Exception & e) + catch (...) { - dropIfEmpty(); - throw e; + if (!attach) + dropIfEmpty(); + throw; } } @@ -262,7 +263,10 @@ StorageReplicatedMergeTree::StorageReplicatedMergeTree( if (!current_zookeeper) { if (!attach) + { + dropIfEmpty(); throw Exception("Can't create replicated table without ZooKeeper", ErrorCodes::NO_ZOOKEEPER); + } /// Do not activate the replica. It will be readonly. LOG_ERROR(log, "No ZooKeeper: table will be in readonly mode."); diff --git a/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py b/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py index 4cb243160a0..ab2db469157 100644 --- a/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py +++ b/tests/integration/test_cleanup_dir_after_bad_zk_conn/test.py @@ -54,9 +54,20 @@ def test_cleanup_dir_after_wrong_replica_name(start_cluster): assert "already exists" in error node1.query("CREATE TABLE test_r2 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test2/', 'r2') ORDER BY n") - def test_cleanup_dir_after_wrong_zk_path(start_cluster): node1.query("CREATE TABLE test3_r1 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test3/', 'r1') ORDER BY n") error = node1.query_and_get_error("CREATE TABLE test3_r2 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/', 'r2') ORDER BY n") assert "Cannot create" in error node1.query("CREATE TABLE test3_r2 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test3/', 'r2') ORDER BY n") + +def test_attach_without_zk(start_cluster): + node1.query("CREATE TABLE test4_r1 (n UInt64) ENGINE=ReplicatedMergeTree('/clickhouse/tables/test4/', 'r1') ORDER BY n") + node1.query("DETACH TABLE test4_r1") + with PartitionManager() as pm: + pm._add_rule({'probability': 0.5, 'source': node1.ip_address, 'destination_port': 2181, 'action': 'DROP'}) + try: + node1.query("ATTACH TABLE test4_r1") + except: + pass + node1.query("ATTACH TABLE IF NOT EXISTS test4_r1") + node1.query("SELECT * FROM test4_r1") From c309f55c207d5e864f1b05200e2a706627163bac Mon Sep 17 00:00:00 2001 From: myrrc Date: Thu, 10 Sep 2020 14:02:52 +0300 Subject: [PATCH 104/341] updated setting and added default value --- src/Functions/CMakeLists.txt | 5 ++++- src/Functions/GatherUtils/CMakeLists.txt | 5 +++-- src/Functions/URL/CMakeLists.txt | 5 +++-- src/Functions/array/CMakeLists.txt | 5 +++-- 4 files changed, 13 insertions(+), 7 deletions(-) diff --git a/src/Functions/CMakeLists.txt b/src/Functions/CMakeLists.txt index 08eefec84d4..b19266726ae 
100644 --- a/src/Functions/CMakeLists.txt +++ b/src/Functions/CMakeLists.txt @@ -57,7 +57,10 @@ option(STRIP_DEBUG_SYMBOLS_FUNCTIONS "Do not generate debugger info for ClickHouse functions. Provides faster linking and lower binary size. Tradeoff is the inability to debug some source files with e.g. gdb - (empty stack frames and no local variables)." OFF) + (empty stack frames and no local variables)." + CMAKE_BUILD_TYPE_UC STREQUAL "RELEASE" + OR CMAKE_BUILD_TYPE_UC STREQUAL "RELWITHDEBINFO" + OR CMAKE_BUILD_TYPE_UC STREQUAL "MINSIZEREL") if (STRIP_DEBUG_SYMBOLS_FUNCTIONS) message(WARNING "Not generating debugger info for ClickHouse functions") diff --git a/src/Functions/GatherUtils/CMakeLists.txt b/src/Functions/GatherUtils/CMakeLists.txt index 921b06fb1c2..3f7f08621a1 100644 --- a/src/Functions/GatherUtils/CMakeLists.txt +++ b/src/Functions/GatherUtils/CMakeLists.txt @@ -3,5 +3,6 @@ add_headers_and_sources(clickhouse_functions_gatherutils .) add_library(clickhouse_functions_gatherutils ${clickhouse_functions_gatherutils_sources} ${clickhouse_functions_gatherutils_headers}) target_link_libraries(clickhouse_functions_gatherutils PRIVATE dbms) -# Won't generate debug info for files with heavy template instantiation to achieve faster linking and lower size. -target_compile_options(clickhouse_functions_gatherutils PRIVATE "-g0") +if (STRIP_DEBUG_SYMBOLS_FUNCTIONS) + target_compile_options(clickhouse_functions_gatherutils PRIVATE "-g0") +endif() diff --git a/src/Functions/URL/CMakeLists.txt b/src/Functions/URL/CMakeLists.txt index 72fdc3174fc..0cf02fd524f 100644 --- a/src/Functions/URL/CMakeLists.txt +++ b/src/Functions/URL/CMakeLists.txt @@ -3,8 +3,9 @@ add_headers_and_sources(clickhouse_functions_url .) add_library(clickhouse_functions_url ${clickhouse_functions_url_sources} ${clickhouse_functions_url_headers}) target_link_libraries(clickhouse_functions_url PRIVATE dbms) -# Won't generate debug info for files with heavy template instantiation to achieve faster linking and lower size. -target_compile_options(clickhouse_functions_url PRIVATE "-g0") +if (STRIP_DEBUG_SYMBOLS_FUNCTIONS) + target_compile_options(clickhouse_functions_url PRIVATE "-g0") +endif() # TODO: move Functions/Regexps.h to some lib and use here target_link_libraries(clickhouse_functions_url PRIVATE hyperscan) diff --git a/src/Functions/array/CMakeLists.txt b/src/Functions/array/CMakeLists.txt index 32ef0216caa..1457e671261 100644 --- a/src/Functions/array/CMakeLists.txt +++ b/src/Functions/array/CMakeLists.txt @@ -3,5 +3,6 @@ add_headers_and_sources(clickhouse_functions_array .) add_library(clickhouse_functions_array ${clickhouse_functions_array_sources} ${clickhouse_functions_array_headers}) target_link_libraries(clickhouse_functions_array PRIVATE dbms clickhouse_functions_gatherutils) -# Won't generate debug info for files with heavy template instantiation to achieve faster linking and lower size. 
-target_compile_options(clickhouse_functions_array PRIVATE "-g0") +if (STRIP_DEBUG_SYMBOLS_FUNCTIONS) + target_compile_options(clickhouse_functions_array PRIVATE "-g0") +endif() From 598c81ed0ac1e127136b54d167e9209e252818be Mon Sep 17 00:00:00 2001 From: myrrc Date: Thu, 10 Sep 2020 14:07:08 +0300 Subject: [PATCH 105/341] fix: default value --- src/Functions/CMakeLists.txt | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/src/Functions/CMakeLists.txt b/src/Functions/CMakeLists.txt index b19266726ae..4f6952aad8f 100644 --- a/src/Functions/CMakeLists.txt +++ b/src/Functions/CMakeLists.txt @@ -53,14 +53,21 @@ endif() target_include_directories(clickhouse_functions SYSTEM PRIVATE ${SPARSEHASH_INCLUDE_DIR}) +if (CMAKE_BUILD_TYPE_UC STREQUAL "RELEASE" + OR CMAKE_BUILD_TYPE_UC STREQUAL "RELWITHDEBINFO" + OR CMAKE_BUILD_TYPE_UC STREQUAL "MINSIZEREL") + set (STRIP_DSF_DEFAULT ON) +else() + set (STRIP_DSF_DEFAULT OFF) +endif() + + option(STRIP_DEBUG_SYMBOLS_FUNCTIONS "Do not generate debugger info for ClickHouse functions. Provides faster linking and lower binary size. Tradeoff is the inability to debug some source files with e.g. gdb (empty stack frames and no local variables)." - CMAKE_BUILD_TYPE_UC STREQUAL "RELEASE" - OR CMAKE_BUILD_TYPE_UC STREQUAL "RELWITHDEBINFO" - OR CMAKE_BUILD_TYPE_UC STREQUAL "MINSIZEREL") + STRIP_DSF_DEFAULT) if (STRIP_DEBUG_SYMBOLS_FUNCTIONS) message(WARNING "Not generating debugger info for ClickHouse functions") From 00b8d91eb859a2642a0583107498d4642c7d4348 Mon Sep 17 00:00:00 2001 From: BohuTANG Date: Thu, 10 Sep 2020 19:46:59 +0800 Subject: [PATCH 106/341] Fix mysql replication TableMapEvent optional metadata ignore --- src/Core/MySQL/IMySQLReadPacket.cpp | 29 ++++++++++--------- src/Core/MySQL/MySQLReplication.cpp | 6 +++- src/Core/tests/mysql_protocol.cpp | 1 + .../MySQL/MaterializeMySQLSyncThread.cpp | 2 ++ 4 files changed, 23 insertions(+), 15 deletions(-) diff --git a/src/Core/MySQL/IMySQLReadPacket.cpp b/src/Core/MySQL/IMySQLReadPacket.cpp index 8fc8855c8a4..5f6bbc7bceb 100644 --- a/src/Core/MySQL/IMySQLReadPacket.cpp +++ b/src/Core/MySQL/IMySQLReadPacket.cpp @@ -50,21 +50,22 @@ uint64_t readLengthEncodedNumber(ReadBuffer & buffer) uint64_t buf = 0; buffer.readStrict(c); auto cc = static_cast(c); - if (cc < 0xfc) + switch (cc) { - return cc; - } - else if (cc < 0xfd) - { - buffer.readStrict(reinterpret_cast(&buf), 2); - } - else if (cc < 0xfe) - { - buffer.readStrict(reinterpret_cast(&buf), 3); - } - else - { - buffer.readStrict(reinterpret_cast(&buf), 8); + /// NULL + case 0xfb: + break; + case 0xfc: + buffer.readStrict(reinterpret_cast(&buf), 2); + break; + case 0xfd: + buffer.readStrict(reinterpret_cast(&buf), 3); + break; + case 0xfe: + buffer.readStrict(reinterpret_cast(&buf), 8); + break; + default: + return cc; } return buf; } diff --git a/src/Core/MySQL/MySQLReplication.cpp b/src/Core/MySQL/MySQLReplication.cpp index 42d077260f8..808e9d1a247 100644 --- a/src/Core/MySQL/MySQLReplication.cpp +++ b/src/Core/MySQL/MySQLReplication.cpp @@ -171,7 +171,9 @@ namespace MySQLReplication /// Ignore MySQL 8.0 optional metadata fields. 
/// https://mysqlhighavailability.com/more-metadata-is-written-into-binary-log/ - payload.ignore(payload.available() - CHECKSUM_CRC32_SIGNATURE_LENGTH); + auto remain = payload.available(); + if (remain > CHECKSUM_CRC32_SIGNATURE_LENGTH) + payload.ignore(remain); } /// Types that do not used in the binlog event: @@ -221,6 +223,7 @@ namespace MySQLReplication } case MYSQL_TYPE_NEWDECIMAL: case MYSQL_TYPE_STRING: { + /// Big-Endian auto b0 = UInt16(meta[pos] << 8); auto b1 = UInt8(meta[pos + 1]); column_meta.emplace_back(UInt16(b0 + b1)); @@ -231,6 +234,7 @@ namespace MySQLReplication case MYSQL_TYPE_BIT: case MYSQL_TYPE_VARCHAR: case MYSQL_TYPE_VAR_STRING: { + /// Little-Endian auto b0 = UInt8(meta[pos]); auto b1 = UInt16(meta[pos + 1] << 8); column_meta.emplace_back(UInt16(b0 + b1)); diff --git a/src/Core/tests/mysql_protocol.cpp b/src/Core/tests/mysql_protocol.cpp index acae8603c40..6cad095fc85 100644 --- a/src/Core/tests/mysql_protocol.cpp +++ b/src/Core/tests/mysql_protocol.cpp @@ -283,6 +283,7 @@ int main(int argc, char ** argv) } { + /// mysql_protocol --host=172.17.0.3 --user=root --password=123 --db=sbtest try { boost::program_options::options_description desc("Allowed options"); diff --git a/src/Databases/MySQL/MaterializeMySQLSyncThread.cpp b/src/Databases/MySQL/MaterializeMySQLSyncThread.cpp index 851ea351876..465a7cb912a 100644 --- a/src/Databases/MySQL/MaterializeMySQLSyncThread.cpp +++ b/src/Databases/MySQL/MaterializeMySQLSyncThread.cpp @@ -195,6 +195,7 @@ void MaterializeMySQLSyncThread::synchronization(const String & mysql_version) } catch (...) { + client.disconnect(); tryLogCurrentException(log); getDatabase(database_name).setException(std::current_exception()); } @@ -206,6 +207,7 @@ void MaterializeMySQLSyncThread::stopSynchronization() { sync_quit = true; background_thread_pool->join(); + client.disconnect(); } } From e0081980230e636545a43a67238dc25b44f7777c Mon Sep 17 00:00:00 2001 From: myrrc Date: Thu, 10 Sep 2020 15:44:49 +0300 Subject: [PATCH 107/341] fix: default value --- src/Functions/CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Functions/CMakeLists.txt b/src/Functions/CMakeLists.txt index 4f6952aad8f..0a99a034a33 100644 --- a/src/Functions/CMakeLists.txt +++ b/src/Functions/CMakeLists.txt @@ -67,7 +67,7 @@ option(STRIP_DEBUG_SYMBOLS_FUNCTIONS Provides faster linking and lower binary size. Tradeoff is the inability to debug some source files with e.g. gdb (empty stack frames and no local variables)." 
- STRIP_DSF_DEFAULT) + ${STRIP_DSF_DEFAULT}) if (STRIP_DEBUG_SYMBOLS_FUNCTIONS) message(WARNING "Not generating debugger info for ClickHouse functions") From 65e9c678f8990756ac22ad2ad10bc08a9c0ec4b4 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 10 Sep 2020 17:47:02 +0300 Subject: [PATCH 108/341] Disable under certain conditions --- src/Common/remapExecutable.cpp | 2 +- src/Common/ya.make | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/src/Common/remapExecutable.cpp b/src/Common/remapExecutable.cpp index ec8b1703b0a..b41fece0c79 100644 --- a/src/Common/remapExecutable.cpp +++ b/src/Common/remapExecutable.cpp @@ -1,4 +1,4 @@ -#if defined(__linux__) && defined(__amd64__) && defined(__SSE2__) +#if defined(__linux__) && defined(__amd64__) && defined(__SSE2__) && !defined(SANITIZER) && defined(NDEBUG) #include #include diff --git a/src/Common/ya.make b/src/Common/ya.make index d9a7a2ce4de..72f1fa42756 100644 --- a/src/Common/ya.make +++ b/src/Common/ya.make @@ -74,6 +74,7 @@ SRCS( QueryProfiler.cpp quoteString.cpp randomSeed.cpp + remapExecutable.cpp RemoteHostFilter.cpp renameat2.cpp RWLock.cpp From f19f02028b7dca3844127a550c8703a8f40fc383 Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Thu, 10 Sep 2020 17:50:10 +0300 Subject: [PATCH 109/341] fix misleading exception message about uuid macro --- src/Common/Macros.cpp | 8 +++++++- src/Storages/MergeTree/registerStorageMergeTree.cpp | 9 +++++---- 2 files changed, 12 insertions(+), 5 deletions(-) diff --git a/src/Common/Macros.cpp b/src/Common/Macros.cpp index 7b5a896015b..a4981fa5be3 100644 --- a/src/Common/Macros.cpp +++ b/src/Common/Macros.cpp @@ -68,8 +68,14 @@ String Macros::expand(const String & s, res += database_name; else if (macro_name == "table" && !table_name.empty()) res += table_name; - else if (macro_name == "uuid" && uuid != UUIDHelpers::Nil) + else if (macro_name == "uuid") + { + if (uuid == UUIDHelpers::Nil) + throw Exception("Macro 'uuid' and empty arguments of ReplicatedMergeTree " + "are supported only for ON CLUSTER queries with Atomic database engine", + ErrorCodes::SYNTAX_ERROR); res += toString(uuid); + } else throw Exception("No macro '" + macro_name + "' in config while processing substitutions in '" + s + "' at '" diff --git a/src/Storages/MergeTree/registerStorageMergeTree.cpp b/src/Storages/MergeTree/registerStorageMergeTree.cpp index b0c422bd79f..d3af3942428 100644 --- a/src/Storages/MergeTree/registerStorageMergeTree.cpp +++ b/src/Storages/MergeTree/registerStorageMergeTree.cpp @@ -395,9 +395,10 @@ static StoragePtr create(const StorageFactory::Arguments & args) if (replicated) { - bool has_arguments = arg_num + 2 <= arg_cnt && engine_args[arg_num]->as() && engine_args[arg_num + 1]->as(); + bool has_arguments = arg_num + 2 <= arg_cnt; + bool has_valid_arguments = has_arguments && engine_args[arg_num]->as() && engine_args[arg_num + 1]->as(); - if (has_arguments) + if (has_valid_arguments) { const auto * ast = engine_args[arg_num]->as(); if (ast && ast->value.getType() == Field::Types::String) @@ -420,7 +421,7 @@ static StoragePtr create(const StorageFactory::Arguments & args) "No replica name in config" + getMergeTreeVerboseHelp(is_extended_storage_def), ErrorCodes::NO_REPLICA_NAME_GIVEN); ++arg_num; } - else if (is_extended_storage_def) + else if (is_extended_storage_def && !has_arguments) { /// Try use default values if arguments are not specified. /// It works for ON CLUSTER queries when database engine is Atomic and there are {shard} and {replica} in config. 
@@ -428,7 +429,7 @@ static StoragePtr create(const StorageFactory::Arguments & args) replica_name = "{replica}"; /// TODO maybe use hostname if {replica} is not defined? } else - throw Exception("Expected zookeper_path and replica_name arguments", ErrorCodes::BAD_ARGUMENTS); + throw Exception("Expected two string literal arguments: zookeper_path and replica_name", ErrorCodes::BAD_ARGUMENTS); /// Allow implicit {uuid} macros only for zookeeper_path in ON CLUSTER queries bool is_on_cluster = args.local_context.getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY; From ca2a33008b291bc5d1507b568ac31d588a6aa3d8 Mon Sep 17 00:00:00 2001 From: Alexander Kuzmenkov Date: Wed, 2 Sep 2020 19:42:24 +0300 Subject: [PATCH 110/341] faster --- docker/test/performance-comparison/eqmed.sql | 4 ++-- docker/test/performance-comparison/perf.py | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docker/test/performance-comparison/eqmed.sql b/docker/test/performance-comparison/eqmed.sql index f7f8d6ac40d..139f0758798 100644 --- a/docker/test/performance-comparison/eqmed.sql +++ b/docker/test/performance-comparison/eqmed.sql @@ -8,7 +8,7 @@ select from ( -- quantiles of randomization distributions - select quantileExactForEach(0.999)( + select quantileExactForEach(0.99)( arrayMap(x, y -> abs(x - y), metrics_by_label[1], metrics_by_label[2]) as d ) threshold ---- uncomment to see what the distribution is really like @@ -33,7 +33,7 @@ from -- strip the query away before the join -- it might be several kB long; (select metrics, run, version from table) no_query, -- duplicate input measurements into many virtual runs - numbers(1, 100000) nn + numbers(1, 10000) nn -- for each virtual run, randomly reorder measurements order by virtual_run, rand() ) virtual_runs diff --git a/docker/test/performance-comparison/perf.py b/docker/test/performance-comparison/perf.py index e1476d9aeb4..05e89c9e44c 100755 --- a/docker/test/performance-comparison/perf.py +++ b/docker/test/performance-comparison/perf.py @@ -20,7 +20,7 @@ parser = argparse.ArgumentParser(description='Run performance test.') parser.add_argument('file', metavar='FILE', type=argparse.FileType('r', encoding='utf-8'), nargs=1, help='test description file') parser.add_argument('--host', nargs='*', default=['localhost'], help="Server hostname(s). Corresponds to '--port' options.") parser.add_argument('--port', nargs='*', default=[9000], help="Server port(s). Corresponds to '--host' options.") -parser.add_argument('--runs', type=int, default=int(os.environ.get('CHPC_RUNS', 13)), help='Number of query runs per server. Defaults to CHPC_RUNS environment variable.') +parser.add_argument('--runs', type=int, default=int(os.environ.get('CHPC_RUNS', 7)), help='Number of query runs per server. 
Defaults to CHPC_RUNS environment variable.') parser.add_argument('--long', action='store_true', help='Do not skip the tests tagged as long.') parser.add_argument('--print-queries', action='store_true', help='Print test queries and exit.') parser.add_argument('--print-settings', action='store_true', help='Print test settings and exit.') From 26348ad0143f881c8d14e41e0c80d706614ab110 Mon Sep 17 00:00:00 2001 From: Alexander Kuzmenkov Date: Thu, 10 Sep 2020 18:48:39 +0300 Subject: [PATCH 111/341] fixup --- docker/test/performance-comparison/report.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/docker/test/performance-comparison/report.py b/docker/test/performance-comparison/report.py index 1003a6d0e1a..b3f8ef01138 100755 --- a/docker/test/performance-comparison/report.py +++ b/docker/test/performance-comparison/report.py @@ -372,7 +372,7 @@ if args.report == 'main': 'New, s', # 1 'Ratio of speedup (-) or slowdown (+)', # 2 'Relative difference (new − old) / old', # 3 - 'p < 0.001 threshold', # 4 + 'p < 0.01 threshold', # 4 # Failed # 5 'Test', # 6 '#', # 7 @@ -416,7 +416,7 @@ if args.report == 'main': 'Old, s', #0 'New, s', #1 'Relative difference (new - old)/old', #2 - 'p < 0.001 threshold', #3 + 'p < 0.01 threshold', #3 # Failed #4 'Test', #5 '#', #6 @@ -649,7 +649,7 @@ elif args.report == 'all-queries': 'New, s', #3 'Ratio of speedup (-) or slowdown (+)', #4 'Relative difference (new − old) / old', #5 - 'p < 0.001 threshold', #6 + 'p < 0.01 threshold', #6 'Test', #7 '#', #8 'Query', #9 From 397ebdb855c75be3df9f6a007a4e2cf3d0321bb5 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Thu, 10 Sep 2020 08:55:39 -0700 Subject: [PATCH 112/341] remove sleep from unit test --- .../configs/asynchronous_metrics_update_period_s.xml | 2 +- tests/queries/0_stateless/01473_event_time_microseconds.sql | 1 - 2 files changed, 1 insertion(+), 2 deletions(-) diff --git a/tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml b/tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml index 840c19f03a6..b658b0436b1 100644 --- a/tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml +++ b/tests/integration/test_asynchronous_metric_log_table/configs/asynchronous_metrics_update_period_s.xml @@ -1,3 +1,3 @@ - 2 + 1 diff --git a/tests/queries/0_stateless/01473_event_time_microseconds.sql b/tests/queries/0_stateless/01473_event_time_microseconds.sql index dd79a735d8f..138df77ffec 100644 --- a/tests/queries/0_stateless/01473_event_time_microseconds.sql +++ b/tests/queries/0_stateless/01473_event_time_microseconds.sql @@ -7,7 +7,6 @@ set log_queries = 1; select '01473_metric_log_table_event_start_time_microseconds_test'; system flush logs; -SELECT sleep(3) Format Null; -- query assumes that the event_time field is accurate. 
WITH ( ( From 964c18241cabe7566f2e639190c143d8f9c7ca2b Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Thu, 10 Sep 2020 19:04:53 +0300 Subject: [PATCH 113/341] Added test from #13829 --- tests/queries/0_stateless/01492_array_join_crash_13829.reference | 0 tests/queries/0_stateless/01492_array_join_crash_13829.sql | 1 + 2 files changed, 1 insertion(+) create mode 100644 tests/queries/0_stateless/01492_array_join_crash_13829.reference create mode 100644 tests/queries/0_stateless/01492_array_join_crash_13829.sql diff --git a/tests/queries/0_stateless/01492_array_join_crash_13829.reference b/tests/queries/0_stateless/01492_array_join_crash_13829.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/01492_array_join_crash_13829.sql b/tests/queries/0_stateless/01492_array_join_crash_13829.sql new file mode 100644 index 00000000000..9e11c3b69d4 --- /dev/null +++ b/tests/queries/0_stateless/01492_array_join_crash_13829.sql @@ -0,0 +1 @@ +SELECT NULL = countEqual(materialize([arrayJoin([NULL, NULL, NULL]), NULL AS x, arrayJoin([255, 1025, NULL, NULL]), arrayJoin([2, 1048576, NULL, NULL])]), materialize(x)) format Null; From 3b3b7bd5e790ec6ef0dff61793c2790167ea3469 Mon Sep 17 00:00:00 2001 From: bharatnc Date: Thu, 10 Sep 2020 09:09:48 -0700 Subject: [PATCH 114/341] minor changes to comment --- src/Storages/StorageReplicatedMergeTree.cpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index 908112c17ff..feb2f95849c 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -226,10 +226,10 @@ StorageReplicatedMergeTree::StorageReplicatedMergeTree( /// This unclean state will hinder table creation on any retries and will /// complain that the Directory for table already exists. /// - /// To acheive a clean state on failed table creations, catch this error if - /// the excaption is of type Poco::Exception and call dropIfEmpty() method, - /// then proceed throwing the exception. Without this, the Directory for the - /// tables need to be manually deleted before retrying the CreateQuery. + /// To achieve a clean state on failed table creations, catch this error and + /// call dropIfEmpty() method only if the operation isn't ATTACH then proceed + /// throwing the exception. Without this, the Directory for the tables need + /// to be manually deleted before retrying the CreateQuery. try { current_zookeeper = global_context.getZooKeeper(); From 15bdb6048e610fb5787e581b7fa346bd7512e109 Mon Sep 17 00:00:00 2001 From: Artem Hnilov Date: Thu, 10 Sep 2020 16:25:07 +0000 Subject: [PATCH 115/341] Function formatReadableQuantity() added. 
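
For context, a minimal usage sketch of the function this patch introduces (illustrative only — the query and the rendered strings below are assumptions based on the shared formatReadableQuantity() helper used by the implementation, and are not part of the committed tests):

    -- hypothetical example, not included in this patch
    SELECT
        arrayJoin([1023, 1234567, 8500000000]) AS value,
        formatReadableQuantity(value) AS readable;
    -- expected to print values roughly like '1.02 thousand', '1.23 million', '8.50 billion'
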
--- src/Functions/FunctionsFormatting.cpp | 1 + src/Functions/FunctionsFormatting.h | 76 +++++++++++++++++++++++++++ 2 files changed, 77 insertions(+) diff --git a/src/Functions/FunctionsFormatting.cpp b/src/Functions/FunctionsFormatting.cpp index 7582e234622..1187749aa2d 100644 --- a/src/Functions/FunctionsFormatting.cpp +++ b/src/Functions/FunctionsFormatting.cpp @@ -9,6 +9,7 @@ void registerFunctionsFormatting(FunctionFactory & factory) { factory.registerFunction(); factory.registerFunction(); + factory.registerFunction(); } } diff --git a/src/Functions/FunctionsFormatting.h b/src/Functions/FunctionsFormatting.h index e11254e2775..da22babec38 100644 --- a/src/Functions/FunctionsFormatting.h +++ b/src/Functions/FunctionsFormatting.h @@ -202,4 +202,80 @@ private: } }; + +class FunctionFormatReadableQuantity : public IFunction +{ +public: + static constexpr auto name = "formatReadableQuantity"; + static FunctionPtr create(const Context &) { return std::make_shared(); } + + String getName() const override + { + return name; + } + + size_t getNumberOfArguments() const override { return 1; } + + DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override + { + const IDataType & type = *arguments[0]; + + if (!isNativeNumber(type)) + throw Exception("Cannot format " + type.getName() + " as quantity", ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT); + + return std::make_shared(); + } + + bool useDefaultImplementationForConstants() const override { return true; } + + void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) const override + { + if (!(executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result) + || executeType(block, arguments, result))) + throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName() + + " of argument of function " + getName(), + ErrorCodes::ILLEGAL_COLUMN); + } + +private: + template + bool executeType(Block & block, const ColumnNumbers & arguments, size_t result) const + { + if (const ColumnVector * col_from = checkAndGetColumn>(block.getByPosition(arguments[0]).column.get())) + { + auto col_to = ColumnString::create(); + + const typename ColumnVector::Container & vec_from = col_from->getData(); + ColumnString::Chars & data_to = col_to->getChars(); + ColumnString::Offsets & offsets_to = col_to->getOffsets(); + size_t size = vec_from.size(); + data_to.resize(size * 2); + offsets_to.resize(size); + + WriteBufferFromVector buf_to(data_to); + + for (size_t i = 0; i < size; ++i) + { + formatReadableQuantity(static_cast(vec_from[i]), buf_to); + writeChar(0, buf_to); + offsets_to[i] = buf_to.count(); + } + + buf_to.finalize(); + block.getByPosition(result).column = std::move(col_to); + return true; + } + + return false; + } +}; + } From 6e0d2a427c4e1a3145d2ac33d6cc94040ffd95dc Mon Sep 17 00:00:00 2001 From: nikitamikhaylov Date: Thu, 10 Sep 2020 19:30:11 +0300 Subject: [PATCH 116/341] add another test --- .../01460_line_as_string_format.reference | 2 ++ .../01460_line_as_string_format.sh | 24 ++++++++++++++----- 2 files changed, 20 insertions(+), 6 deletions(-) diff --git a/tests/queries/0_stateless/01460_line_as_string_format.reference 
b/tests/queries/0_stateless/01460_line_as_string_format.reference index dec67eb2e0a..c795fba4309 100644 --- a/tests/queries/0_stateless/01460_line_as_string_format.reference +++ b/tests/queries/0_stateless/01460_line_as_string_format.reference @@ -4,3 +4,5 @@ "array" : [1, 2, 3], Finally implement this new feature. +42 ClickHouse +42 ClickHouse is a `fast` #open-source# (OLAP) database "management" :system: diff --git a/tests/queries/0_stateless/01460_line_as_string_format.sh b/tests/queries/0_stateless/01460_line_as_string_format.sh index a985bc207a8..60a960d2bf8 100755 --- a/tests/queries/0_stateless/01460_line_as_string_format.sh +++ b/tests/queries/0_stateless/01460_line_as_string_format.sh @@ -3,17 +3,29 @@ CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) . "$CURDIR"/../shell_config.sh -$CLICKHOUSE_CLIENT --query="DROP TABLE IF EXISTS line_as_string"; - -$CLICKHOUSE_CLIENT --query="CREATE TABLE line_as_string(field String) ENGINE = Memory"; +$CLICKHOUSE_CLIENT --query="DROP TABLE IF EXISTS line_as_string1"; +$CLICKHOUSE_CLIENT --query="CREATE TABLE line_as_string1(field String) ENGINE = Memory"; echo '"id" : 1, "date" : "01.01.2020", "string" : "123{{{\"\\", "array" : [1, 2, 3], -Finally implement this new feature.' | $CLICKHOUSE_CLIENT --query="INSERT INTO line_as_string FORMAT LineAsString"; +Finally implement this new feature.' | $CLICKHOUSE_CLIENT --query="INSERT INTO line_as_string1 FORMAT LineAsString"; -$CLICKHOUSE_CLIENT --query="SELECT * FROM line_as_string"; -$CLICKHOUSE_CLIENT --query="DROP TABLE line_as_string" +$CLICKHOUSE_CLIENT --query="SELECT * FROM line_as_string1"; +$CLICKHOUSE_CLIENT --query="DROP TABLE line_as_string1" +$CLICKHOUSE_CLIENT --query="DROP TABLE IF EXISTS line_as_string2"; +$CLICKHOUSE_CLIENT --query="create table line_as_string2( + a UInt64 default 42, + b String materialized toString(a), + c String +) engine=MergeTree() order by tuple();"; + +$CLICKHOUSE_CLIENT --query="INSERT INTO line_as_string2(c) values ('ClickHouse')"; + +echo 'ClickHouse is a `fast` #open-source# (OLAP) 'database' "management" :system:' | $CLICKHOUSE_CLIENT --query="INSERT INTO line_as_string2(c) FORMAT LineAsString"; + +$CLICKHOUSE_CLIENT --query="SELECT * FROM line_as_string2 order by c"; +$CLICKHOUSE_CLIENT --query="DROP TABLE line_as_string2" From d0c259974d1486dc90ae29958a3f1dd196052961 Mon Sep 17 00:00:00 2001 From: nikitamikhaylov Date: Thu, 10 Sep 2020 19:35:18 +0300 Subject: [PATCH 117/341] style check --- .../Formats/Impl/LineAsStringRowInputFormat.cpp | 15 ++++++--------- src/Processors/ya.make | 2 +- 2 files changed, 7 insertions(+), 10 deletions(-) diff --git a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp index 27bc71d764d..befc635386f 100644 --- a/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/LineAsStringRowInputFormat.cpp @@ -8,8 +8,7 @@ namespace DB namespace ErrorCodes { - extern const int LOGICAL_ERROR; - extern const int INCORRECT_DATA; + extern const int INCORRECT_QUERY; } LineAsStringRowInputFormat::LineAsStringRowInputFormat(const Block & header_, ReadBuffer & in_, Params params_) : @@ -17,7 +16,7 @@ LineAsStringRowInputFormat::LineAsStringRowInputFormat(const Block & header_, Re { if (header_.columns() > 1 || header_.getDataTypes()[0]->getTypeId() != TypeIndex::String) { - throw Exception("This input format is only suitable for tables with a single column of type String.", ErrorCodes::LOGICAL_ERROR); + throw Exception("This input 
format is only suitable for tables with a single column of type String.", ErrorCodes::INCORRECT_QUERY); } } @@ -39,7 +38,8 @@ void LineAsStringRowInputFormat::readLineObject(IColumn & column) { pos = find_first_symbols<'\n', '\\'>(buf.position(), buf.buffer().end()); buf.position() = pos; - if (buf.position() == buf.buffer().end()) { + if (buf.position() == buf.buffer().end()) + { over = true; break; } @@ -48,14 +48,11 @@ void LineAsStringRowInputFormat::readLineObject(IColumn & column) newline = false; } else if (*buf.position() == '\\') - { + { ++buf.position(); if (!buf.eof()) - { - ++buf.position(); - } + ++buf.position(); } - } buf.makeContinuousMemoryFromCheckpointToPos(); diff --git a/src/Processors/ya.make b/src/Processors/ya.make index 8fe4e651ade..c69d274a70e 100644 --- a/src/Processors/ya.make +++ b/src/Processors/ya.make @@ -25,7 +25,6 @@ SRCS( Formats/Impl/ConstantExpressionTemplate.cpp Formats/Impl/CSVRowInputFormat.cpp Formats/Impl/CSVRowOutputFormat.cpp - Formats/Impl/LineAsStringRowInputFormat.cpp Formats/Impl/JSONAsStringRowInputFormat.cpp Formats/Impl/JSONCompactEachRowRowInputFormat.cpp Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp @@ -34,6 +33,7 @@ SRCS( Formats/Impl/JSONEachRowRowOutputFormat.cpp Formats/Impl/JSONEachRowWithProgressRowOutputFormat.cpp Formats/Impl/JSONRowOutputFormat.cpp + Formats/Impl/LineAsStringRowInputFormat.cpp Formats/Impl/MarkdownRowOutputFormat.cpp Formats/Impl/MsgPackRowInputFormat.cpp Formats/Impl/MsgPackRowOutputFormat.cpp From 4e197cf069c18cafb55b5fa22499483d8f19666d Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 10 Sep 2020 19:41:46 +0300 Subject: [PATCH 118/341] Remove unused headers --- base/common/types.h | 2 -- 1 file changed, 2 deletions(-) diff --git a/base/common/types.h b/base/common/types.h index 682fe94366c..a02398a3365 100644 --- a/base/common/types.h +++ b/base/common/types.h @@ -1,8 +1,6 @@ #pragma once -#include #include -#include #include #include From 45340c701dc517b29db5a1047c306f88ba891722 Mon Sep 17 00:00:00 2001 From: Alexander Kuzmenkov Date: Thu, 10 Sep 2020 19:49:57 +0300 Subject: [PATCH 119/341] changelog for 20.8 --- CHANGELOG.md | 148 ++++++++++++++++++++++ utils/simple-backport/backport.sh | 7 +- utils/simple-backport/format-changelog.py | 2 +- 3 files changed, 154 insertions(+), 3 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 345ee2c6213..f3266520eb1 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,3 +1,151 @@ +## ClickHouse release 20.8 + +### ClickHouse release v20.8.2.3-stable, 2020-09-08 + +#### Backward Incompatible Change + +* Now `OPTIMIZE FINAL` query doesn't recalculate TTL for parts that were added before TTL was created. Use `ALTER TABLE ... MATERIALIZE TTL` once to calculate them, after that `OPTIMIZE FINAL` will evaluate TTL's properly. This behavior never worked for replicated tables. [#14220](https://github.com/ClickHouse/ClickHouse/pull/14220) ([alesapin](https://github.com/alesapin)). +* Extend `parallel_distributed_insert_select` setting, adding an option to run `INSERT` into local table. The setting changes type from `Bool` to `UInt64`, so the values `false` and `true` are no longer supported. If you have these values in server configuration, the server will not start. Please replace them with `0` and `1`, respectively. [#14060](https://github.com/ClickHouse/ClickHouse/pull/14060) ([Azat Khuzhin](https://github.com/azat)). +* Remove support for the `ODBCDriver` input/output format. 
This was a deprecated format once used for communication with the ClickHouse ODBC driver, now long superseded by the `ODBCDriver2` format. Resolves [#13629](https://github.com/ClickHouse/ClickHouse/issues/13629). [#13847](https://github.com/ClickHouse/ClickHouse/pull/13847) ([hexiaoting](https://github.com/hexiaoting)). + +#### New Feature + +* Add `countDigits(x)` function that count number of decimal digits in integer or decimal column. Add `isDecimalOverflow(d, [p])` function that checks if the value in Decimal column is out of its (or specified) precision. [#14151](https://github.com/ClickHouse/ClickHouse/pull/14151) ([Artem Zuikov](https://github.com/4ertus2)). +* Add setting `min_index_granularity_bytes` that protects against accidentally creating a table with very low `index_granularity_bytes` setting. [#14139](https://github.com/ClickHouse/ClickHouse/pull/14139) ([Bharat Nallan](https://github.com/bharatnc)). +* Add the ability to specify `Default` compression codec for columns that correspond to settings specified in `config.xml`. Implements: [#9074](https://github.com/ClickHouse/ClickHouse/issues/9074). [#14049](https://github.com/ClickHouse/ClickHouse/pull/14049) ([alesapin](https://github.com/alesapin)). +* Added `date_trunc` function that truncates a date/time value to a specified date/time part. [#13888](https://github.com/ClickHouse/ClickHouse/pull/13888) ([Vladimir Golovchenko](https://github.com/vladimir-golovchenko)). +* Add `time_zones` table. [#13880](https://github.com/ClickHouse/ClickHouse/pull/13880) ([Bharat Nallan](https://github.com/bharatnc)). +* Add function `defaultValueOfTypeName` that returns the default value for a given type. [#13877](https://github.com/ClickHouse/ClickHouse/pull/13877) ([hcz](https://github.com/hczhcz)). +* Add `quantileExactLow` and `quantileExactHigh` implementations with respective aliases for `medianExactLow` and `medianExactHigh`. [#13818](https://github.com/ClickHouse/ClickHouse/pull/13818) ([Bharat Nallan](https://github.com/bharatnc)). +* Add function `normalizeQuery` that replaces literals, sequences of literals and complex aliases with placeholders. Add function `normalizedQueryHash` that returns identical 64bit hash values for similar queries. It helps to analyze query log. This closes [#11271](https://github.com/ClickHouse/ClickHouse/issues/11271). [#13816](https://github.com/ClickHouse/ClickHouse/pull/13816) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Add new optional section to the main config. [#13425](https://github.com/ClickHouse/ClickHouse/pull/13425) ([Vitaly Baranov](https://github.com/vitlibar)). +* Add `ALTER SAMPLE BY` statement that allows to change table sample clause. [#13280](https://github.com/ClickHouse/ClickHouse/pull/13280) ([Amos Bird](https://github.com/amosbird)). +* Function `position` now supports optional `start_pos` argument. [#13237](https://github.com/ClickHouse/ClickHouse/pull/13237) ([vdimir](https://github.com/vdimir)). +* Add types `Int128`, `Int256`, `UInt256` and related functions for them. Extend Decimals with Decimal256 (precision up to 76 digits). New types are under the setting `allow_experimental_bigint_types`. [#13097](https://github.com/ClickHouse/ClickHouse/pull/13097) ([Artem Zuikov](https://github.com/4ertus2)). +* Support Kerberos authentication in Kafka, using `krb5` and `cyrus-sasl` libraries. [#12771](https://github.com/ClickHouse/ClickHouse/pull/12771) ([Ilya Golshtein](https://github.com/ilejn)). +* Support `MaterializeMySQL` database engine. 
Implements [#4006](https://github.com/ClickHouse/ClickHouse/issues/4006). [#10851](https://github.com/ClickHouse/ClickHouse/pull/10851) ([Winter Zhang](https://github.com/zhang2014)). + +#### Bug Fix + +* Check for array size overflow in `topK` aggregate function. Without this check the user may send a query with carefully crafter parameters that will lead to server crash. This closes [#14452](https://github.com/ClickHouse/ClickHouse/issues/14452). [#14467](https://github.com/ClickHouse/ClickHouse/pull/14467) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix bug which leads to wrong merges assignment if table has partitions with a single part. [#14444](https://github.com/ClickHouse/ClickHouse/pull/14444) ([alesapin](https://github.com/alesapin)). +* Stop query execution if exception happened in `PipelineExecutor` itself. This could prevent rare possible query hung. Continuation of [#14334](https://github.com/ClickHouse/ClickHouse/issues/14334). [#14402](https://github.com/ClickHouse/ClickHouse/pull/14402) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Stop query execution if exception happened in `PipelineExecutor` itself. This could prevent rare possible query hung. [#14334](https://github.com/ClickHouse/ClickHouse/pull/14334) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix crash during `ALTER` query for table which was created `AS table_function`. Fixes [#14212](https://github.com/ClickHouse/ClickHouse/issues/14212). [#14326](https://github.com/ClickHouse/ClickHouse/pull/14326) ([alesapin](https://github.com/alesapin)). +* Fix exception during ALTER LIVE VIEW query with REFRESH command. [#14320](https://github.com/ClickHouse/ClickHouse/pull/14320) ([Bharat Nallan](https://github.com/bharatnc)). +* Fix QueryPlan lifetime (for EXPLAIN PIPELINE graph=1) for queries with nested interpreter. [#14315](https://github.com/ClickHouse/ClickHouse/pull/14315) ([Azat Khuzhin](https://github.com/azat)). +* Fix segfault in `clickhouse-odbc-bridge` during schema fetch from some external sources. This PR fixes https://github.com/ClickHouse/ClickHouse/issues/13861. [#14267](https://github.com/ClickHouse/ClickHouse/pull/14267) ([Vitaly Baranov](https://github.com/vitlibar)). +* Disallows `CODEC` on `ALIAS` column type. Fixes [#13911](https://github.com/ClickHouse/ClickHouse/issues/13911). [#14263](https://github.com/ClickHouse/ClickHouse/pull/14263) ([Bharat Nallan](https://github.com/bharatnc)). +* Fix handling of empty transactions in `MaterializeMySQL` database engine. This fixes [#14235](https://github.com/ClickHouse/ClickHouse/issues/14235). [#14253](https://github.com/ClickHouse/ClickHouse/pull/14253) ([BohuTANG](https://github.com/BohuTANG)). +* fixes [#14231](https://github.com/ClickHouse/ClickHouse/issues/14231) fix wrong lexer in MaterializeMySQL database engine dump stage. [#14232](https://github.com/ClickHouse/ClickHouse/pull/14232) ([Winter Zhang](https://github.com/zhang2014)). +* Fix crash in mark inclusion search introduced in https://github.com/ClickHouse/ClickHouse/pull/12277 . [#14225](https://github.com/ClickHouse/ClickHouse/pull/14225) ([Amos Bird](https://github.com/amosbird)). +* Fixed incorrect sorting order if LowCardinality column. This fixes [#13958](https://github.com/ClickHouse/ClickHouse/issues/13958). [#14223](https://github.com/ClickHouse/ClickHouse/pull/14223) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix creation of tables with named tuples. 
This fixes [#13027](https://github.com/ClickHouse/ClickHouse/issues/13027). [#14143](https://github.com/ClickHouse/ClickHouse/pull/14143) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix formatting of minimal negative decimal numbers. This fixes https://github.com/ClickHouse/ClickHouse/issues/14111. [#14119](https://github.com/ClickHouse/ClickHouse/pull/14119) ([Alexander Kuzmenkov](https://github.com/akuzm)). +* When waiting for a dictionary update to complete, use the timeout specified by `query_wait_timeout_milliseconds` setting instead of a hard-coded value. [#14105](https://github.com/ClickHouse/ClickHouse/pull/14105) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix DistributedFilesToInsert metric (zeroed when it should not). [#14095](https://github.com/ClickHouse/ClickHouse/pull/14095) ([Azat Khuzhin](https://github.com/azat)). +* Fix pointInPolygon with const 2d array as polygon. [#14079](https://github.com/ClickHouse/ClickHouse/pull/14079) ([Alexey Ilyukhov](https://github.com/livace)). +* Fixed wrong mount point in extra info for `Poco::Exception: no space left on device`. [#14050](https://github.com/ClickHouse/ClickHouse/pull/14050) ([tavplubix](https://github.com/tavplubix)). +* Fix GRANT ALL statement when executed on a non-global level. [#13987](https://github.com/ClickHouse/ClickHouse/pull/13987) ([Vitaly Baranov](https://github.com/vitlibar)). +* Fix parser to reject create table as table function with engine. [#13940](https://github.com/ClickHouse/ClickHouse/pull/13940) ([hcz](https://github.com/hczhcz)). +* Fix wrong results in select queries with `DISTINCT` keyword in case `optimize_duplicate_order_by_and_distinct` setting is enabled. [#13925](https://github.com/ClickHouse/ClickHouse/pull/13925) ([Artem Zuikov](https://github.com/4ertus2)). +* Fixed potential deadlock when renaming `Distributed` table. [#13922](https://github.com/ClickHouse/ClickHouse/pull/13922) ([tavplubix](https://github.com/tavplubix)). +* Fix incorrect sorting for `FixedString` columns. Fixes [#13182](https://github.com/ClickHouse/ClickHouse/issues/13182). [#13887](https://github.com/ClickHouse/ClickHouse/pull/13887) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix topK/topKWeighted merge (with non-default parameters). [#13817](https://github.com/ClickHouse/ClickHouse/pull/13817) ([Azat Khuzhin](https://github.com/azat)). +* Fix reading from MergeTree table with INDEX of type SET fails when comparing against NULL. This fixes [#13686](https://github.com/ClickHouse/ClickHouse/issues/13686). [#13793](https://github.com/ClickHouse/ClickHouse/pull/13793) ([Amos Bird](https://github.com/amosbird)). +* Fix arrayJoin() capturing in lambda (LOGICAL_ERROR). [#13792](https://github.com/ClickHouse/ClickHouse/pull/13792) ([Azat Khuzhin](https://github.com/azat)). +* Fix step overflow in range(). [#13790](https://github.com/ClickHouse/ClickHouse/pull/13790) ([Azat Khuzhin](https://github.com/azat)). +* Fixed `Directory not empty` error when concurrently executing `DROP DATABASE` and `CREATE TABLE`. [#13756](https://github.com/ClickHouse/ClickHouse/pull/13756) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Add range check for h3KRing function. This fixes [#13633](https://github.com/ClickHouse/ClickHouse/issues/13633). [#13752](https://github.com/ClickHouse/ClickHouse/pull/13752) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix race condition between DETACH and background merges. Parts may revive after detach. 
This is continuation of [#8602](https://github.com/ClickHouse/ClickHouse/issues/8602) that did not fix the issue but introduced a test that started to fail in very rare cases, demonstrating the issue. [#13746](https://github.com/ClickHouse/ClickHouse/pull/13746) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix logging Settings.Names/Values when log_queries_min_type > QUERY_START. [#13737](https://github.com/ClickHouse/ClickHouse/pull/13737) ([Azat Khuzhin](https://github.com/azat)). +* Fixes /replicas_status endpoint response status code when verbose=1. [#13722](https://github.com/ClickHouse/ClickHouse/pull/13722) ([javi santana](https://github.com/javisantana)). +* Fix incorrect message in `clickhouse-server.init` while checking user and group. [#13711](https://github.com/ClickHouse/ClickHouse/pull/13711) ([ylchou](https://github.com/ylchou)). +* Fix visible data clobbering by progress bar in client in interactive mode. This fixes [#12562](https://github.com/ClickHouse/ClickHouse/issues/12562) and [#13369](https://github.com/ClickHouse/ClickHouse/issues/13369) and [#13584](https://github.com/ClickHouse/ClickHouse/issues/13584) and fixes [#12964](https://github.com/ClickHouse/ClickHouse/issues/12964). [#13691](https://github.com/ClickHouse/ClickHouse/pull/13691) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Do not optimize any(arrayJoin()) -> arrayJoin() under optimize_move_functions_out_of_any. [#13681](https://github.com/ClickHouse/ClickHouse/pull/13681) ([Azat Khuzhin](https://github.com/azat)). +* Fix crash in JOIN with StorageMerge and `set enable_optimize_predicate_expression=1`. [#13679](https://github.com/ClickHouse/ClickHouse/pull/13679) ([Artem Zuikov](https://github.com/4ertus2)). +* Fix typo in error message about `The value of 'number_of_free_entries_in_pool_to_lower_max_size_of_merge' setting`. [#13678](https://github.com/ClickHouse/ClickHouse/pull/13678) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Concurrent `ALTER ... REPLACE/MOVE PARTITION ...` queries might cause deadlock. It's fixed. [#13626](https://github.com/ClickHouse/ClickHouse/pull/13626) ([tavplubix](https://github.com/tavplubix)). +* Fixed the behaviour when sometimes cache-dictionary returned default value instead of present value from source. [#13624](https://github.com/ClickHouse/ClickHouse/pull/13624) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix secondary indices corruption in compact parts. [#13538](https://github.com/ClickHouse/ClickHouse/pull/13538) ([Anton Popov](https://github.com/CurtizJ)). +* Fix premature `ON CLUSTER` timeouts for queries that must be executed on a single replica. Fixes [#6704](https://github.com/ClickHouse/ClickHouse/issues/6704), [#7228](https://github.com/ClickHouse/ClickHouse/issues/7228), [#13361](https://github.com/ClickHouse/ClickHouse/issues/13361), [#11884](https://github.com/ClickHouse/ClickHouse/issues/11884). [#13450](https://github.com/ClickHouse/ClickHouse/pull/13450) ([alesapin](https://github.com/alesapin)). +* Fix wrong code in function `netloc`. This fixes [#13335](https://github.com/ClickHouse/ClickHouse/issues/13335). [#13446](https://github.com/ClickHouse/ClickHouse/pull/13446) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix possible race in `StorageMemory`. https://clickhouse-test-reports.s3.yandex.net/0/9cac8a7244063d2092ad25d45502611e18d3749c/stress_test_(thread)/stderr.log Have no idea how to write a test. 
[#13416](https://github.com/ClickHouse/ClickHouse/pull/13416) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix missing or excessive headers in `TSV/CSVWithNames` formats. This fixes [#12504](https://github.com/ClickHouse/ClickHouse/issues/12504). [#13343](https://github.com/ClickHouse/ClickHouse/pull/13343) ([Azat Khuzhin](https://github.com/azat)). +* Fix parsing row policies from users.xml when names of databases or tables contain dots. This fixes https://github.com/ClickHouse/ClickHouse/issues/5779, https://github.com/ClickHouse/ClickHouse/issues/12527. [#13199](https://github.com/ClickHouse/ClickHouse/pull/13199) ([Vitaly Baranov](https://github.com/vitlibar)). +* Fix access to redis dictionary after connection was dropped once. It may happen with `cache` and `direct` dictionary layouts. [#13082](https://github.com/ClickHouse/ClickHouse/pull/13082) ([Anton Popov](https://github.com/CurtizJ)). +* Removed wrong auth access check when using ClickHouseDictionarySource to query remote tables. [#12756](https://github.com/ClickHouse/ClickHouse/pull/12756) ([sundyli](https://github.com/sundy-li)). +* subquery hash values are not enough to distinguish. https://github.com/ClickHouse/ClickHouse/issues/8333. [#8367](https://github.com/ClickHouse/ClickHouse/pull/8367) ([Amos Bird](https://github.com/amosbird)). + +#### Improvement + +* Now it's possible to `ALTER TABLE table_name FETCH PARTITION partition_expr FROM 'zk://:/path-in-zookeeper'`. It's useful for shipping data to new clusters. [#14155](https://github.com/ClickHouse/ClickHouse/pull/14155) ([Amos Bird](https://github.com/amosbird)). +* Slightly better performance of Memory table if it was constructed from a huge number of very small blocks (that's unlikely). Author of the idea: [Mark Papadakis](https://github.com/markpapadakis). Closes [#14043](https://github.com/ClickHouse/ClickHouse/issues/14043). [#14056](https://github.com/ClickHouse/ClickHouse/pull/14056) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Conditional aggregate functions (for example: `avgIf`, `sumIf`, `maxIf`) should return `NULL` when miss rows and use nullable arguments. [#13964](https://github.com/ClickHouse/ClickHouse/pull/13964) ([Winter Zhang](https://github.com/zhang2014)). +* Increase limit in -Resample combinator to 1M. [#13947](https://github.com/ClickHouse/ClickHouse/pull/13947) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Corrected an error in AvroConfluent format that caused the Kafka table engine to stop processing messages when an abnormally small, malformed, message was received. [#13941](https://github.com/ClickHouse/ClickHouse/pull/13941) ([Gervasio Varela](https://github.com/gervarela)). +* Fix wrong error for long queries. It was possible to get syntax error other than `Max query size exceeded` for correct query. [#13928](https://github.com/ClickHouse/ClickHouse/pull/13928) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Better error message for null value of TabSeparatedRow format. [#13906](https://github.com/ClickHouse/ClickHouse/pull/13906) ([jiang tao](https://github.com/tomjiang1987)). +* Function `arrayCompact` will compare NaNs bitwise if the type of array elements is Float32/Float64. In previous versions NaNs were always not equal if the type of array elements is Float32/Float64 and were always equal if the type is more complex, like Nullable(Float64). This closes [#13857](https://github.com/ClickHouse/ClickHouse/issues/13857). 
[#13868](https://github.com/ClickHouse/ClickHouse/pull/13868) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix data race in `lgamma` function. This race was caught only in `tsan`, no side effects really happened. [#13842](https://github.com/ClickHouse/ClickHouse/pull/13842) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* 1. Add [GTID-Based Replication](https://dev.mysql.com/doc/refman/5.7/en/replication-gtids-concepts.html); it works even when the replication topology changes and is supported/preferred in MySQL 5.6/5.7/8.0. 2. Add BIT/SET field type support. 3. Fix up varchar type meta length bug. [#13820](https://github.com/ClickHouse/ClickHouse/pull/13820) ([BohuTANG](https://github.com/BohuTANG)). +* Avoid too slow queries when arrays are manipulated as fields. Throw exception instead. [#13753](https://github.com/ClickHouse/ClickHouse/pull/13753) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Added Redis requirepass authorization. [#13688](https://github.com/ClickHouse/ClickHouse/pull/13688) ([Ivan Torgashov](https://github.com/it1804)). +* Add MergeTree Write-Ahead-Log (WAL) dump tool. [#13640](https://github.com/ClickHouse/ClickHouse/pull/13640) ([BohuTANG](https://github.com/BohuTANG)). +* In previous versions the `lcm` function may produce an assertion violation in debug build if called with specifically crafted arguments. This fixes [#13368](https://github.com/ClickHouse/ClickHouse/issues/13368). [#13510](https://github.com/ClickHouse/ClickHouse/pull/13510) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Provide monotonicity for `toDate/toDateTime` functions in more cases. Now the input arguments are saturated more naturally and provide better monotonicity. [#13497](https://github.com/ClickHouse/ClickHouse/pull/13497) ([Amos Bird](https://github.com/amosbird)). +* Support compound identifiers for custom settings. [#13496](https://github.com/ClickHouse/ClickHouse/pull/13496) ([Vitaly Baranov](https://github.com/vitlibar)). +* Move parts from DiskLocal to DiskS3 in parallel. [#13459](https://github.com/ClickHouse/ClickHouse/pull/13459) ([Pavel Kovalenko](https://github.com/Jokser)). +* Enable mixed granularity parts by default. [#13449](https://github.com/ClickHouse/ClickHouse/pull/13449) ([alesapin](https://github.com/alesapin)). +* Proper remote host checking in S3 redirects (security-related thing). [#13404](https://github.com/ClickHouse/ClickHouse/pull/13404) ([Vladimir Chebotarev](https://github.com/excitoon)). +* Add QueryTimeMicroseconds, SelectQueryTimeMicroseconds and InsertQueryTimeMicroseconds to system.events. [#13336](https://github.com/ClickHouse/ClickHouse/pull/13336) ([ianton-ru](https://github.com/ianton-ru)). +* Fix assert when decimal has too large negative exponent. Fixes [#13188](https://github.com/ClickHouse/ClickHouse/issues/13188). [#13228](https://github.com/ClickHouse/ClickHouse/pull/13228) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Added cache layer for DiskS3 (cache to local disk mark and index files). [#13076](https://github.com/ClickHouse/ClickHouse/pull/13076) ([Pavel Kovalenko](https://github.com/Jokser)). + +#### Performance Improvement + +* Slightly optimize very short queries with LowCardinality. [#14129](https://github.com/ClickHouse/ClickHouse/pull/14129) ([Anton Popov](https://github.com/CurtizJ)). +* Enable parallel INSERTs for table engines `Null`, `Memory`, `Distributed` and `Buffer`. 
[#14120](https://github.com/ClickHouse/ClickHouse/pull/14120) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fail fast if `max_rows_to_read` limit is exceeded on parts scan. The motivation behind this change is to skip the ranges scan for all selected parts if it is clear that `max_rows_to_read` is already exceeded. The change is quite noticeable for queries over a big number of parts. [#13677](https://github.com/ClickHouse/ClickHouse/pull/13677) ([Roman Khavronenko](https://github.com/hagen1778)). +* Slightly improve performance of aggregation by UInt8/UInt16 keys. [#13099](https://github.com/ClickHouse/ClickHouse/pull/13099) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Optimize `has()`, `indexOf()` and `countEqual()` functions for `Array(LowCardinality(T))` and constant right arguments. [#12550](https://github.com/ClickHouse/ClickHouse/pull/12550) ([myrrc](https://github.com/myrrc)). +* When performing trivial `INSERT SELECT` queries, automatically set `max_threads` to 1 or `max_insert_threads`, and set `max_block_size` to `min_insert_block_size_rows`. Related to [#5907](https://github.com/ClickHouse/ClickHouse/issues/5907). [#12195](https://github.com/ClickHouse/ClickHouse/pull/12195) ([flynn](https://github.com/ucasFL)). + +#### Build/Testing/Packaging Improvement + +* There are actually no symlinks in `contrib/cctz/testdata/zoneinfo`, so `-type f` is enough: ``` ~/workspace/ClickHouse/contrib/cctz/testdata/zoneinfo$ find . -type l -ls | wc -l 0 ``` Closes [#14209](https://github.com/ClickHouse/ClickHouse/issues/14209). [#14215](https://github.com/ClickHouse/ClickHouse/pull/14215) ([filimonov](https://github.com/filimonov)). +* Switch test docker images to use the test-base parent. [#14167](https://github.com/ClickHouse/ClickHouse/pull/14167) ([Ilya Yatsishin](https://github.com/qoega)). +* Add the ability to write js-style comments in skip_list.json. [#14159](https://github.com/ClickHouse/ClickHouse/pull/14159) ([alesapin](https://github.com/alesapin)). +* Add retry logic when bringing up the docker-compose cluster and increase COMPOSE_HTTP_TIMEOUT. [#14112](https://github.com/ClickHouse/ClickHouse/pull/14112) ([vzakaznikov](https://github.com/vzakaznikov)). +* Enabled text-log in stress test to find more bugs. [#13855](https://github.com/ClickHouse/ClickHouse/pull/13855) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Testflows LDAP module: adding missing certificates and dhparam.pem for openldap4. [#13780](https://github.com/ClickHouse/ClickHouse/pull/13780) ([vzakaznikov](https://github.com/vzakaznikov)). +* ZooKeeper cannot work reliably in unit tests in CI infrastructure. Using unit tests for ZooKeeper interaction with a real ZooKeeper is a bad idea from the start (unit tests are not supposed to verify complex distributed systems). We are already using integration tests for this purpose and they are better suited. [#13745](https://github.com/ClickHouse/ClickHouse/pull/13745) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Added docker image for style check. Added style check that all docker and docker compose files are located in the docker directory. [#13724](https://github.com/ClickHouse/ClickHouse/pull/13724) ([Ilya Yatsishin](https://github.com/qoega)). +* Fix Cassandra build on Mac OS. [#13708](https://github.com/ClickHouse/ClickHouse/pull/13708) ([Ilya Yatsishin](https://github.com/qoega)). +* Fix link error in shared build. [#13700](https://github.com/ClickHouse/ClickHouse/pull/13700) ([Amos Bird](https://github.com/amosbird)). 
+* Add a CMake option to fail configuration instead of auto-reconfiguration, enabled by default. [#13687](https://github.com/ClickHouse/ClickHouse/pull/13687) ([Konstantin](https://github.com/podshumok)). +* Updating LDAP user authentication suite to check that it works with RBAC. [#13656](https://github.com/ClickHouse/ClickHouse/pull/13656) ([vzakaznikov](https://github.com/vzakaznikov)). +* Expose version of embedded tzdata via TZDATA_VERSION in system.build_options. [#13648](https://github.com/ClickHouse/ClickHouse/pull/13648) ([filimonov](https://github.com/filimonov)). +* Removed `-DENABLE_CURL_CLIENT` for `contrib/aws`. [#13628](https://github.com/ClickHouse/ClickHouse/pull/13628) ([Vladimir Chebotarev](https://github.com/excitoon)). +* Build ClickHouse with the most fresh tzdata from package repository. [#13623](https://github.com/ClickHouse/ClickHouse/pull/13623) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Increasing health-check timeouts for ClickHouse nodes and adding support to dump docker-compose logs if unhealthy containers found. [#13612](https://github.com/ClickHouse/ClickHouse/pull/13612) ([vzakaznikov](https://github.com/vzakaznikov)). +* Make sure https://github.com/ClickHouse/ClickHouse/issues/10977 is invalid. [#13539](https://github.com/ClickHouse/ClickHouse/pull/13539) ([Amos Bird](https://github.com/amosbird)). +* Enable Shellcheck in CI as a linter of .sh tests. This closes [#13168](https://github.com/ClickHouse/ClickHouse/issues/13168). [#13530](https://github.com/ClickHouse/ClickHouse/pull/13530) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix the remaining shellcheck notices. A preparation to enable Shellcheck. [#13529](https://github.com/ClickHouse/ClickHouse/pull/13529) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Added `clickhouse install` script, that is useful if you only have a single binary. [#13528](https://github.com/ClickHouse/ClickHouse/pull/13528) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Allow to run `clickhouse` binary without configuration. [#13515](https://github.com/ClickHouse/ClickHouse/pull/13515) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Ensure that there is no copy-pasted GPL code. [#13514](https://github.com/ClickHouse/ClickHouse/pull/13514) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Enable check for typos in code with `codespell`. [#13513](https://github.com/ClickHouse/ClickHouse/pull/13513) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Fix typos in code with codespell. [#13511](https://github.com/ClickHouse/ClickHouse/pull/13511) ([alexey-milovidov](https://github.com/alexey-milovidov)). +* Skip PR's from robot-clickhouse. [#13489](https://github.com/ClickHouse/ClickHouse/pull/13489) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Move Dockerfiles from integration tests to `docker/test` directory. docker_compose files are available in `runner` docker container. Docker images are built in CI and not in integration tests. [#13448](https://github.com/ClickHouse/ClickHouse/pull/13448) ([Ilya Yatsishin](https://github.com/qoega)). + +#### Other + +* Create `system` database with `Atomic` engine by default. [#13680](https://github.com/ClickHouse/ClickHouse/pull/13680) ([tavplubix](https://github.com/tavplubix)). +* Fix readline so it dumps history to file now. [#13600](https://github.com/ClickHouse/ClickHouse/pull/13600) ([Amos Bird](https://github.com/amosbird)). 
+ + ## ClickHouse release 20.7 ### ClickHouse release v20.7.2.30-stable, 2020-08-31 diff --git a/utils/simple-backport/backport.sh b/utils/simple-backport/backport.sh index 71920304d56..64f8e6004bf 100755 --- a/utils/simple-backport/backport.sh +++ b/utils/simple-backport/backport.sh @@ -4,7 +4,10 @@ set -e branch="$1" merge_base=$(git merge-base origin/master "origin/$branch") master_git_cmd=(git log "$merge_base..origin/master" --first-parent) -branch_git_cmd=(git log "$merge_base..origin/$branch" --first-parent) +# The history in back branches shouldn't be too crazy, and sometimes we have a PR +# that merges several backport commits there (3f2cba6824fddf31c30bde8c6f4f860572f4f580), +# so don't use --first-parent +branch_git_cmd=(git log "$merge_base..origin/$branch") # Make lists of PRs that were merged into each branch. Use first parent here, or else # we'll get weird things like seeing older master that was merged into a PR branch @@ -30,7 +33,7 @@ fi # Search for PR numbers in commit messages. First variant is normal merge, and second # variant is squashed. Next are some backport message variants. find_prs=(sed -n "s/^.*merg[eding]*.*#\([[:digit:]]\+\).*$/\1/Ip; - s/^.*(#\([[:digit:]]\+\))$/\1/p; + s/^.*#\([[:digit:]]\+\))$/\1/p; s/^.*back[- ]*port[ed of]*.*#\([[:digit:]]\+\).*$/\1/Ip; s/^.*cherry[- ]*pick[ed of]*.*#\([[:digit:]]\+\).*$/\1/Ip") diff --git a/utils/simple-backport/format-changelog.py b/utils/simple-backport/format-changelog.py index ccda88c6809..5dff4f1c5e8 100755 --- a/utils/simple-backport/format-changelog.py +++ b/utils/simple-backport/format-changelog.py @@ -93,7 +93,7 @@ for line in args.file: # Normalize category name for c in categories_preferred_order: - if fuzzywuzzy.fuzz.ratio(pr['category'], c) >= 90: + if fuzzywuzzy.fuzz.ratio(pr['category'].lower(), c.lower()) >= 90: pr['category'] = c break From 142026f4abc810426d4ebf195bb8316a83b6adff Mon Sep 17 00:00:00 2001 From: Artem Hnilov Date: Thu, 10 Sep 2020 16:54:52 +0000 Subject: [PATCH 120/341] 01492_format_readable_quantity test added --- .../01492_format_readable_quantity.reference | 50 +++++++++++++++++++ .../01492_format_readable_quantity.sql | 4 ++ 2 files changed, 54 insertions(+) create mode 100644 tests/queries/0_stateless/01492_format_readable_quantity.reference create mode 100644 tests/queries/0_stateless/01492_format_readable_quantity.sql diff --git a/tests/queries/0_stateless/01492_format_readable_quantity.reference b/tests/queries/0_stateless/01492_format_readable_quantity.reference new file mode 100644 index 00000000000..3736933b5ee --- /dev/null +++ b/tests/queries/0_stateless/01492_format_readable_quantity.reference @@ -0,0 +1,50 @@ +1.00 1.00 1.00 +2.72 2.00 2.00 +7.39 7.00 7.00 +20.09 20.00 20.00 +54.60 54.00 54.00 +148.41 148.00 148.00 +403.43 403.00 403.00 +1.10 thousand 1.10 thousand 1.10 thousand +2.98 thousand 2.98 thousand 2.98 thousand +8.10 thousand 8.10 thousand 8.10 thousand +22.03 thousand 22.03 thousand 22.03 thousand +59.87 thousand 59.87 thousand 59.87 thousand +162.75 thousand 162.75 thousand 162.75 thousand +442.41 thousand 442.41 thousand 442.41 thousand +1.20 million 1.20 million 1.20 million +3.27 million 3.27 million 3.27 million +8.89 million 8.89 million 8.89 million +24.15 million 24.15 million 24.15 million +65.66 million 65.66 million 65.66 million +178.48 million 178.48 million 178.48 million +485.17 million 485.17 million 485.17 million +1.32 billion 1.32 billion 1.32 billion +3.58 billion 3.58 billion -2.15 billion +9.74 billion 9.74 billion -2.15 billion +26.49 
billion 26.49 billion -2.15 billion +72.00 billion 72.00 billion -2.15 billion +195.73 billion 195.73 billion -2.15 billion +532.05 billion 532.05 billion -2.15 billion +1.45 trillion 1.45 trillion -2.15 billion +3.93 trillion 3.93 trillion -2.15 billion +10.69 trillion 10.69 trillion -2.15 billion +29.05 trillion 29.05 trillion -2.15 billion +78.96 trillion 78.96 trillion -2.15 billion +214.64 trillion 214.64 trillion -2.15 billion +583.46 trillion 583.46 trillion -2.15 billion +1.59 quadrillion 1.59 quadrillion -2.15 billion +4.31 quadrillion 4.31 quadrillion -2.15 billion +11.72 quadrillion 11.72 quadrillion -2.15 billion +31.86 quadrillion 31.86 quadrillion -2.15 billion +86.59 quadrillion 86.59 quadrillion -2.15 billion +235.39 quadrillion 235.39 quadrillion -2.15 billion +639.84 quadrillion 639.84 quadrillion -2.15 billion +1739.27 quadrillion 1739.27 quadrillion -2.15 billion +4727.84 quadrillion 4727.84 quadrillion -2.15 billion +12851.60 quadrillion 12851.60 quadrillion -2.15 billion +34934.27 quadrillion 0.00 -2.15 billion +94961.19 quadrillion 0.00 -2.15 billion +258131.29 quadrillion 0.00 -2.15 billion +701673.59 quadrillion 0.00 -2.15 billion +1907346.57 quadrillion 0.00 -2.15 billion diff --git a/tests/queries/0_stateless/01492_format_readable_quantity.sql b/tests/queries/0_stateless/01492_format_readable_quantity.sql new file mode 100644 index 00000000000..c2ebcfc1a97 --- /dev/null +++ b/tests/queries/0_stateless/01492_format_readable_quantity.sql @@ -0,0 +1,4 @@ +WITH round(exp(number), 6) AS x, toUInt64(x) AS y, toInt32(x) AS z +SELECT formatReadableQuantity(x), formatReadableQuantity(y), formatReadableQuantity(z) +FROM system.numbers +LIMIT 50; From 8689797efc4d749f4cda139818b1a94caccfe628 Mon Sep 17 00:00:00 2001 From: Alexander Kuzmenkov Date: Thu, 10 Sep 2020 19:57:26 +0300 Subject: [PATCH 121/341] Run only some queries in perf tests, not all combos --- docker/test/performance-comparison/compare.sh | 17 ++++++++++++++++- docker/test/performance-comparison/perf.py | 12 ++++++++++-- 2 files changed, 26 insertions(+), 3 deletions(-) diff --git a/docker/test/performance-comparison/compare.sh b/docker/test/performance-comparison/compare.sh index 364e9994ab7..0b678024765 100755 --- a/docker/test/performance-comparison/compare.sh +++ b/docker/test/performance-comparison/compare.sh @@ -121,7 +121,7 @@ function run_tests then # Use the explicitly set path to directory with test files. test_prefix="$CHPC_TEST_PATH" - elif [ "$PR_TO_TEST" = "0" ] + elif [ "$PR_TO_TEST" == "0" ] then # When testing commits from master, use the older test files. This # allows the tests to pass even when we add new functions and tests for @@ -155,6 +155,20 @@ function run_tests test_files=$(ls "$test_prefix"/*.xml) fi + # For PRs, test only a subset of queries, and run them less times. + # If the corresponding environment variables are already set, keep + # those values. + if [ "$PR_TO_TEST" == "0" ] + then + CHPC_TEST_RUNS=${CHPC_RUNS:-7} + CHPC_MAX_QUERIES=${CHPC_MAX_QUERIES:-15} + else + CHPC_TEST_RUNS=${CHPC_RUNS:-13} + CHPC_MAX_QUERIES=${CHPC_MAX_QUERIES:-0} + fi + export CHPC_TEST_RUNS + export CHPC_MAX_QUERIES + # Determine which concurrent benchmarks to run. For now, the only test # we run as a concurrent benchmark is 'website'. Run it as benchmark if we # are also going to run it as a normal test. 
@@ -187,6 +201,7 @@ function run_tests # the grep is to filter out set -x output and keep only time output { \ time "$script_dir/perf.py" --host localhost localhost --port 9001 9002 \ + --runs "$CHPC_RUNS" --max-queries "$CHPC_MAX_QUERIES" \ -- "$test" > "$test_name-raw.tsv" 2> "$test_name-err.log" ; \ } 2>&1 >/dev/null | grep -v ^+ >> "wall-clock-times.tsv" \ || echo "Test $test_name failed with error code $?" >> "$test_name-err.log" diff --git a/docker/test/performance-comparison/perf.py b/docker/test/performance-comparison/perf.py index e1476d9aeb4..64314c129b5 100755 --- a/docker/test/performance-comparison/perf.py +++ b/docker/test/performance-comparison/perf.py @@ -7,6 +7,7 @@ import clickhouse_driver import xml.etree.ElementTree as et import argparse import pprint +import random import re import string import time @@ -20,7 +21,8 @@ parser = argparse.ArgumentParser(description='Run performance test.') parser.add_argument('file', metavar='FILE', type=argparse.FileType('r', encoding='utf-8'), nargs=1, help='test description file') parser.add_argument('--host', nargs='*', default=['localhost'], help="Server hostname(s). Corresponds to '--port' options.") parser.add_argument('--port', nargs='*', default=[9000], help="Server port(s). Corresponds to '--host' options.") -parser.add_argument('--runs', type=int, default=int(os.environ.get('CHPC_RUNS', 13)), help='Number of query runs per server. Defaults to CHPC_RUNS environment variable.') +parser.add_argument('--runs', type=int, default=1, help='Number of query runs per server.') +parser.add_argument('--max-queries', type=int, default=None, help='Test no more than this number of queries, chosen at random.') parser.add_argument('--long', action='store_true', help='Do not skip the tests tagged as long.') parser.add_argument('--print-queries', action='store_true', help='Print test queries and exit.') parser.add_argument('--print-settings', action='store_true', help='Print test settings and exit.') @@ -189,8 +191,14 @@ for conn_index, c in enumerate(connections): c.execute(q) print(f'fill\t{conn_index}\t{c.last_query.elapsed}\t{tsv_escape(q)}') +# Run the queries in randomized order, but preserve their indexes as specified +# in the test XML. To avoid using too much time, limit the number of queries +# we run per test. +queries_to_run = random.sample(range(0, len(test_queries)), args.max_queries or len(test_queries)) + # Run test queries. 
-for query_index, q in enumerate(test_queries): +for query_index in queries_to_run: + q = test_queries[query_index] query_prefix = f'{test_name}.query{query_index}' # We have some crazy long queries (about 100kB), so trim them to a sane From bbe379d58e96968ae24c7dee5fef9e872aa2f272 Mon Sep 17 00:00:00 2001 From: Artem Hnilov Date: Thu, 10 Sep 2020 17:06:32 +0000 Subject: [PATCH 122/341] 00534_filimonov.data was updated --- tests/queries/0_stateless/00534_filimonov.data | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/queries/0_stateless/00534_filimonov.data b/tests/queries/0_stateless/00534_filimonov.data index b4c15b01ef4..393ff5b7155 100644 --- a/tests/queries/0_stateless/00534_filimonov.data +++ b/tests/queries/0_stateless/00534_filimonov.data @@ -174,6 +174,7 @@ SELECT sipHash64(NULL); SELECT protocol(NULL); SELECT toInt16OrZero(NULL); SELECT formatReadableSize(NULL); +SELECT formatReadableQuantity(NULL); SELECT concatAssumeInjective(NULL); SELECT toString(NULL); SELECT MACStringToNum(NULL); From 5675efbd47fde50524463a14758c672091264897 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 10 Sep 2020 20:16:12 +0300 Subject: [PATCH 123/341] Fix build --- src/Common/remapExecutable.cpp | 30 ++++++++++++++---------------- 1 file changed, 14 insertions(+), 16 deletions(-) diff --git a/src/Common/remapExecutable.cpp b/src/Common/remapExecutable.cpp index b41fece0c79..6b86e8717a4 100644 --- a/src/Common/remapExecutable.cpp +++ b/src/Common/remapExecutable.cpp @@ -89,20 +89,6 @@ __attribute__((__noinline__)) int64_t our_syscall(...) } -__attribute__((__always_inline__)) void our_memcpy(char * __restrict dst, const char * __restrict src, ssize_t n) -{ - while (n > 0) - { - _mm_storeu_si128(reinterpret_cast<__m128i *>(dst), - _mm_loadu_si128(reinterpret_cast(src))); - - dst += 16; - src += 16; - n -= 16; - } -} - - __attribute__((__noinline__)) void remapToHugeStep3(void * scratch, size_t size, size_t offset) { /// The function should not use the stack, otherwise various optimizations, including "omit-frame-pointer" may break the code. @@ -122,7 +108,7 @@ __attribute__((__noinline__)) void remapToHugeStep2(void * begin, size_t size, v /** Unmap old memory region with the code of our program. * Our instruction pointer is located inside scratch area and this function can execute after old code is unmapped. * But it cannot call any other functions because they are not available at usual addresses - * - that's why we have to use "our_syscall" and "our_memcpy" functions. + * - that's why we have to use "our_syscall" function and a substitution for memcpy. * (Relative addressing may continue to work but we should not assume that). */ @@ -152,7 +138,19 @@ __attribute__((__noinline__)) void remapToHugeStep2(void * begin, size_t size, v /// Copy the code from scratch area to the old memory location. - our_memcpy(reinterpret_cast(begin), reinterpret_cast(scratch), size); + { + __m128i * __restrict dst = reinterpret_cast<__m128i *>(begin); + const __m128i * __restrict src = reinterpret_cast(scratch); + const __m128i * __restrict src_end = reinterpret_cast(reinterpret_cast(scratch) + size); + while (src < src_end) + { + _mm_storeu_si128(dst, _mm_loadu_si128(src)); + + ++dst; + ++src; + } + } + //syscall_func(SYS_write, 2, &dot, 1); /// Make the memory area with the code executable and non-writable. 
From 294af54007b761fbab57f006b4e074f9f996944a Mon Sep 17 00:00:00 2001 From: Artem Hnilov Date: Thu, 10 Sep 2020 20:27:37 +0300 Subject: [PATCH 124/341] Update other-functions.md --- .../functions/other-functions.md | 23 +++++++++++++++++++ 1 file changed, 23 insertions(+) diff --git a/docs/ru/sql-reference/functions/other-functions.md b/docs/ru/sql-reference/functions/other-functions.md index 468e15e7d57..7b9dacf21cd 100644 --- a/docs/ru/sql-reference/functions/other-functions.md +++ b/docs/ru/sql-reference/functions/other-functions.md @@ -508,6 +508,29 @@ SELECT └────────────────┴────────────┘ ``` +## formatReadableQuantity(x) {#formatreadablequantityx} + +Принимает число. Возвращает округленное число с суффиксом (thousand, million, billion и т.д.) в виде строки. + +Облегчает визуальное восприятие больших чисел живым человеком. + +Пример: + +``` sql +SELECT + arrayJoin([1024, 1234 * 1000, (4567 * 1000) * 1000, 98765432101234]) AS number, + formatReadableQuantity(number) AS number_for_humans +``` + +``` text +┌─────────number─┬─number_for_humans─┐ +│ 1024 │ 1.02 thousand │ +│ 1234000 │ 1.23 million │ +│ 4567000000 │ 4.57 billion │ +│ 98765432101234 │ 98.77 trillion │ +└────────────────┴───────────────────┘ +``` + ## least(a, b) {#leasta-b} Возвращает наименьшее значение из a и b. From 726277adec1da5924da59883f17945a8e29e0195 Mon Sep 17 00:00:00 2001 From: Artem Hnilov Date: Thu, 10 Sep 2020 20:34:23 +0300 Subject: [PATCH 125/341] Update other-functions.md --- .../functions/other-functions.md | 23 +++++++++++++++++++ 1 file changed, 23 insertions(+) diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md index 05247b6db7d..1c059e9f97b 100644 --- a/docs/en/sql-reference/functions/other-functions.md +++ b/docs/en/sql-reference/functions/other-functions.md @@ -515,6 +515,29 @@ SELECT └────────────────┴────────────┘ ``` +## formatReadableQuantity(x) {#formatreadablequantityx} + +Accepts the number. Returns a rounded number with a suffix (thousand, million, billion, etc.) as a string. + +It is useful for reading big numbers by human. + +Example: + +``` sql +SELECT + arrayJoin([1024, 1234 * 1000, (4567 * 1000) * 1000, 98765432101234]) AS number, + formatReadableQuantity(number) AS number_for_humans +``` + +``` text +┌─────────number─┬─number_for_humans─┐ +│ 1024 │ 1.02 thousand │ +│ 1234000 │ 1.23 million │ +│ 4567000000 │ 4.57 billion │ +│ 98765432101234 │ 98.77 trillion │ +└────────────────┴───────────────────┘ +``` + ## least(a, b) {#leasta-b} Returns the smallest value from a and b. From 54491b8608043871634973b997042864ca29bc6f Mon Sep 17 00:00:00 2001 From: Ivan Blinkov Date: Thu, 10 Sep 2020 22:23:23 +0300 Subject: [PATCH 126/341] Update README.md --- README.md | 1 - 1 file changed, 1 deletion(-) diff --git a/README.md b/README.md index 7f6a102a2dd..f14f2e88886 100644 --- a/README.md +++ b/README.md @@ -17,5 +17,4 @@ ClickHouse is an open-source column-oriented database management system that all ## Upcoming Events -* [ClickHouse Data Integration Virtual Meetup](https://www.eventbrite.com/e/clickhouse-september-virtual-meetup-data-integration-tickets-117421895049) on September 10, 2020. * [ClickHouse talk at Ya.Subbotnik (in Russian)](https://ya.cc/t/cIBI-3yECj5JF) on September 12, 2020. 
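A note on the `formatReadableQuantity` additions above (the `01492_format_readable_quantity` test and the documentation entries): in the expected test output, the second and third columns stop following the first one because the test casts `exp(number)` to `UInt64` and `Int32` before formatting, and those integer types run out of range long before `Float64` does — per the reference file, the `Int32` column pins at `-2.15 billion` and the `UInt64` column drops to `0.00`. The query below is an illustrative sketch only and is not part of any patch in this series; the chosen constants and the commented results are assumptions inferred from the reference file, not output captured from a server.

``` sql
-- Illustrative sketch (not part of the patch series above).
-- Shows why the UInt64 and Int32 columns in 01492_format_readable_quantity.reference
-- diverge from the Float64 column once the value leaves the integer type's range.
WITH 1e10 AS over_int32_range, 1e20 AS over_uint64_range
SELECT
    formatReadableQuantity(over_int32_range)            AS float_value,   -- expected: '10.00 billion'
    formatReadableQuantity(toInt32(over_int32_range))   AS int32_value,   -- expected: '-2.15 billion', as in the reference file
    formatReadableQuantity(toUInt64(over_uint64_range)) AS uint64_value;  -- expected: '0.00', as in the reference file
```

The related `formatReadableSize` function (exercised alongside it in `00534_filimonov.data`) renders byte sizes the same way and accepts `NULL` with the same semantics.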
From f2a5216e97f1283b373720717f1d6f7ac79af86d Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Fri, 11 Sep 2020 02:24:16 +0300 Subject: [PATCH 127/341] add waiting for fsync in WAL --- src/Common/FileSyncGuard.h | 2 +- src/Storages/MergeTree/MergeTreeSettings.h | 1 + src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp | 14 +++++++++----- src/Storages/MergeTree/MergeTreeWriteAheadLog.h | 5 +++-- utils/durability-test/durability-test.sh | 12 ++++++++++++ 5 files changed, 26 insertions(+), 8 deletions(-) diff --git a/src/Common/FileSyncGuard.h b/src/Common/FileSyncGuard.h index 5ec9b1d0c98..6451f6ebf36 100644 --- a/src/Common/FileSyncGuard.h +++ b/src/Common/FileSyncGuard.h @@ -17,7 +17,7 @@ public: FileSyncGuard(const DiskPtr & disk_, int fd_) : disk(disk_), fd(fd_) {} FileSyncGuard(const DiskPtr & disk_, const String & path) - : disk(disk_), fd(disk_->open(path, O_RDONLY)) {} + : disk(disk_), fd(disk_->open(path, O_RDWR)) {} ~FileSyncGuard() { diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index 3f8f44dc11e..8652a6ef691 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -47,6 +47,7 @@ struct Settings; M(Bool, fsync_part_directory, false, "Do fsync for part directory after all part operations (writes, renames, etc.).", 0) \ M(UInt64, write_ahead_log_bytes_to_fsync, 100ULL * 1024 * 1024, "Amount of bytes, accumulated in WAL to do fsync.", 0) \ M(UInt64, write_ahead_log_interval_ms_to_fsync, 100, "Interval in milliseconds after which fsync for WAL is being done.", 0) \ + M(Bool, in_memory_parts_insert_sync, false, "If true insert of part with in-memory format will wait for fsync of WAL", 0) \ \ /** Inserts settings. */ \ M(UInt64, parts_to_delay_insert, 150, "If table contains at least that many active parts in single partition, artificially slow down insert into table.", 0) \ diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp index 5cfe9017248..bc6738a8321 100644 --- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp +++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp @@ -33,6 +33,7 @@ MergeTreeWriteAheadLog::MergeTreeWriteAheadLog( std::lock_guard lock(write_mutex); out->sync(); sync_scheduled = false; + sync_cv.notify_all(); }); } @@ -50,7 +51,7 @@ void MergeTreeWriteAheadLog::init() void MergeTreeWriteAheadLog::addPart(const Block & block, const String & part_name) { - std::lock_guard lock(write_mutex); + std::unique_lock lock(write_mutex); auto part_info = MergeTreePartInfo::fromPartName(part_name, storage.format_version); min_block_number = std::min(min_block_number, part_info.min_block); @@ -70,7 +71,7 @@ void MergeTreeWriteAheadLog::addPart(const Block & block, const String & part_na void MergeTreeWriteAheadLog::dropPart(const String & part_name) { - std::lock_guard lock(write_mutex); + std::unique_lock lock(write_mutex); writeIntBinary(static_cast(0), *out); writeIntBinary(static_cast(ActionType::DROP_PART), *out); @@ -78,7 +79,7 @@ void MergeTreeWriteAheadLog::dropPart(const String & part_name) sync(lock); } -void MergeTreeWriteAheadLog::rotate(const std::lock_guard &) +void MergeTreeWriteAheadLog::rotate(const std::unique_lock &) { String new_name = String(WAL_FILE_NAME) + "_" + toString(min_block_number) + "_" @@ -90,7 +91,7 @@ void MergeTreeWriteAheadLog::rotate(const std::lock_guard &) MergeTreeData::MutableDataPartsVector MergeTreeWriteAheadLog::restore(const StorageMetadataPtr & metadata_snapshot) { - 
std::lock_guard lock(write_mutex); + std::unique_lock lock(write_mutex); MergeTreeData::MutableDataPartsVector parts; auto in = disk->readFile(path, DBMS_DEFAULT_BUFFER_SIZE); @@ -185,7 +186,7 @@ MergeTreeData::MutableDataPartsVector MergeTreeWriteAheadLog::restore(const Stor return result; } -void MergeTreeWriteAheadLog::sync(const std::lock_guard &) +void MergeTreeWriteAheadLog::sync(std::unique_lock & lock) { size_t bytes_to_sync = storage.getSettings()->write_ahead_log_bytes_to_fsync; time_t time_to_sync = storage.getSettings()->write_ahead_log_interval_ms_to_fsync; @@ -201,6 +202,9 @@ void MergeTreeWriteAheadLog::sync(const std::lock_guard &) sync_task->scheduleAfter(time_to_sync); sync_scheduled = true; } + + if (storage.getSettings()->in_memory_parts_insert_sync) + sync_cv.wait(lock, [this] { return !sync_scheduled; }); } std::optional diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.h b/src/Storages/MergeTree/MergeTreeWriteAheadLog.h index 43abf3c04be..c5675eac696 100644 --- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.h +++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.h @@ -44,8 +44,8 @@ public: private: void init(); - void rotate(const std::lock_guard & lock); - void sync(const std::lock_guard & lock); + void rotate(const std::unique_lock & lock); + void sync(std::unique_lock & lock); const MergeTreeData & storage; DiskPtr disk; @@ -60,6 +60,7 @@ private: BackgroundSchedulePool & pool; BackgroundSchedulePoolTaskHolder sync_task; + std::condition_variable sync_cv; size_t bytes_at_last_sync = 0; bool sync_scheduled = false; diff --git a/utils/durability-test/durability-test.sh b/utils/durability-test/durability-test.sh index c7f8936ec95..97c39473b69 100755 --- a/utils/durability-test/durability-test.sh +++ b/utils/durability-test/durability-test.sh @@ -1,5 +1,17 @@ #!/bin/bash +: ' +A simple test for durability. It starts up clickhouse server in qemu VM and runs +inserts via clickhouse benchmark tool. Then it kills VM in random moment and +checks whether table contains broken parts. With enabled fsync no broken parts +should be appeared. + +Usage: + +./install.sh +./durability-test.sh +' + URL=http://cloud-images.ubuntu.com/bionic/current IMAGE=bionic-server-cloudimg-amd64.img SSH_PORT=11022 From 2873777857351a939564e7fac0a285bf8222f19c Mon Sep 17 00:00:00 2001 From: BohuTANG Date: Fri, 11 Sep 2020 12:54:53 +0800 Subject: [PATCH 128/341] Ignore unprocessed replication payload --- src/Core/MySQL/MySQLReplication.cpp | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/src/Core/MySQL/MySQLReplication.cpp b/src/Core/MySQL/MySQLReplication.cpp index 808e9d1a247..e7f113ba7af 100644 --- a/src/Core/MySQL/MySQLReplication.cpp +++ b/src/Core/MySQL/MySQLReplication.cpp @@ -171,9 +171,7 @@ namespace MySQLReplication /// Ignore MySQL 8.0 optional metadata fields. 
/// https://mysqlhighavailability.com/more-metadata-is-written-into-binary-log/ - auto remain = payload.available(); - if (remain > CHECKSUM_CRC32_SIGNATURE_LENGTH) - payload.ignore(remain); + payload.ignoreAll(); } /// Types that do not used in the binlog event: @@ -915,7 +913,7 @@ namespace MySQLReplication break; } } - payload.tryIgnore(CHECKSUM_CRC32_SIGNATURE_LENGTH); + payload.ignoreAll(); } } From da2bb4e0d3d2e642993f070b923401a9db470d81 Mon Sep 17 00:00:00 2001 From: Amos Bird Date: Fri, 11 Sep 2020 15:46:14 +0800 Subject: [PATCH 129/341] Fix missing clone in replace column transformer --- src/Parsers/ASTColumnsTransformers.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Parsers/ASTColumnsTransformers.cpp b/src/Parsers/ASTColumnsTransformers.cpp index 2625a03830b..43d54f07ab8 100644 --- a/src/Parsers/ASTColumnsTransformers.cpp +++ b/src/Parsers/ASTColumnsTransformers.cpp @@ -110,7 +110,7 @@ void ASTColumnsReplaceTransformer::replaceChildren(ASTPtr & node, const ASTPtr & if (const auto * id = child->as()) { if (id->shortName() == name) - child = replacement; + child = replacement->clone(); } else replaceChildren(child, replacement, name); From 3b9ab3f1be330b5ae7ffd7c68fd629ad3ebc9f6b Mon Sep 17 00:00:00 2001 From: alesapin Date: Fri, 11 Sep 2020 12:23:31 +0300 Subject: [PATCH 130/341] Fix if --- src/Functions/if.cpp | 19 +++++++++++++++---- 1 file changed, 15 insertions(+), 4 deletions(-) diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index 20848bede32..584bed3f8c5 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -604,7 +604,6 @@ private: const ColumnUInt8 * cond_col, Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) { /// Convert both columns to the common type (if needed). 
- const ColumnWithTypeAndName & arg1 = block.getByPosition(arguments[1]); const ColumnWithTypeAndName & arg2 = block.getByPosition(arguments[2]); @@ -765,10 +764,22 @@ private: return ColumnNullable::create(materialized, ColumnUInt8::create(column->size(), 0)); } - static ColumnPtr getNestedColumn(const ColumnPtr & column) + /// Return nested column recursively removing Nullable, examples: + /// Nullable(size = 1, Int32(size = 1), UInt8(size = 1)) -> Int32(size = 1) + /// Const(size = 0, Nullable(size = 1, Int32(size = 1), UInt8(size = 1))) -> + /// Const(size = 0, Int32(size = 1)) + static ColumnPtr recursiveGetNestedColumnWithoutNullable(const ColumnPtr & column) { if (const auto * nullable = checkAndGetColumn(*column)) + { + /// Nullable cannot contain Nullable return nullable->getNestedColumnPtr(); + } + else if (const auto * column_const = checkAndGetColumn(*column)) + { + /// Save Constant, but remove Nullable + return ColumnConst::create(recursiveGetNestedColumnWithoutNullable(column_const->getDataColumnPtr()), column->size()); + } return column; } @@ -826,12 +837,12 @@ private: { arg_cond, { - getNestedColumn(arg_then.column), + recursiveGetNestedColumnWithoutNullable(arg_then.column), removeNullable(arg_then.type), "" }, { - getNestedColumn(arg_else.column), + recursiveGetNestedColumnWithoutNullable(arg_else.column), removeNullable(arg_else.type), "" }, From 5de3d9c03298101876df60eed11ca2499676faf5 Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Fri, 11 Sep 2020 12:58:04 +0300 Subject: [PATCH 131/341] Update version_date.tsv after release 20.6.6.7 --- utils/list-versions/version_date.tsv | 1 + 1 file changed, 1 insertion(+) diff --git a/utils/list-versions/version_date.tsv b/utils/list-versions/version_date.tsv index d97fdbfa080..3915000cec3 100644 --- a/utils/list-versions/version_date.tsv +++ b/utils/list-versions/version_date.tsv @@ -1,5 +1,6 @@ v20.8.2.3-stable 2020-09-08 v20.7.2.30-stable 2020-08-31 +v20.6.6.7-stable 2020-09-11 v20.6.5.8-stable 2020-09-03 v20.6.4.44-stable 2020-08-20 v20.6.3.28-stable 2020-08-07 From e25b1da29fa168b24464c83c1f661b363916afad Mon Sep 17 00:00:00 2001 From: alesapin Date: Fri, 11 Sep 2020 13:53:26 +0300 Subject: [PATCH 132/341] Disable -Wstringop-overflow for gcc-10 --- cmake/warnings.cmake | 11 +++++++++-- src/Storages/MergeTree/MergeTreePartition.cpp | 8 -------- 2 files changed, 9 insertions(+), 10 deletions(-) diff --git a/cmake/warnings.cmake b/cmake/warnings.cmake index aec3e46ffa6..6b26b9b95a5 100644 --- a/cmake/warnings.cmake +++ b/cmake/warnings.cmake @@ -169,9 +169,16 @@ elseif (COMPILER_GCC) # Warn if vector operation is not implemented via SIMD capabilities of the architecture add_cxx_compile_options(-Wvector-operation-performance) - # XXX: gcc10 stuck with this option while compiling GatherUtils code - # (anyway there are builds with clang, that will warn) if (CMAKE_CXX_COMPILER_VERSION VERSION_GREATER_EQUAL 10) + # XXX: gcc10 stuck with this option while compiling GatherUtils code + # (anyway there are builds with clang, that will warn) add_cxx_compile_options(-Wno-sequence-point) + # XXX: gcc10 false positive with this warning in MergeTreePartition.cpp + # inlined from 'void writeHexByteLowercase(UInt8, void*)' at ../src/Common/hex.h:39:11, + # inlined from 'DB::String DB::MergeTreePartition::getID(const DB::Block&) const' at ../src/Storages/MergeTree/MergeTreePartition.cpp:85:30: + # ../contrib/libc-headers/x86_64-linux-gnu/bits/string_fortified.h:34:33: error: writing 2 bytes into a region of size 0 
[-Werror=stringop-overflow=] + # 34 | return __builtin___memcpy_chk (__dest, __src, __len, __bos0 (__dest)); + # For some reason (bug in gcc?) macro 'GCC diagnostic ignored "-Wstringop-overflow"' doesn't help. + add_cxx_compile_options(-Wno-stringop-overflow) endif() endif () diff --git a/src/Storages/MergeTree/MergeTreePartition.cpp b/src/Storages/MergeTree/MergeTreePartition.cpp index 2802b842f54..880a3aa181d 100644 --- a/src/Storages/MergeTree/MergeTreePartition.cpp +++ b/src/Storages/MergeTree/MergeTreePartition.cpp @@ -29,11 +29,6 @@ String MergeTreePartition::getID(const MergeTreeData & storage) const return getID(storage.getInMemoryMetadataPtr()->getPartitionKey().sample_block); } -#if defined (__GNUC__) && __GNUC__ >= 10 - #pragma GCC diagnostic push - #pragma GCC diagnostic ignored "-Wstringop-overflow" -#endif - /// NOTE: This ID is used to create part names which are then persisted in ZK and as directory names on the file system. /// So if you want to change this method, be sure to guarantee compatibility with existing table data. String MergeTreePartition::getID(const Block & partition_key_sample) const @@ -92,9 +87,6 @@ String MergeTreePartition::getID(const Block & partition_key_sample) const return result; } -#if defined (__GNUC__) && __GNUC__ >= 10 - #pragma GCC diagnostic pop -#endif void MergeTreePartition::serializeText(const MergeTreeData & storage, WriteBuffer & out, const FormatSettings & format_settings) const { From c36192db233af7ce3f971a0cd950db4cfbb6175d Mon Sep 17 00:00:00 2001 From: alesapin Date: Fri, 11 Sep 2020 13:54:03 +0300 Subject: [PATCH 133/341] Remove diff --- src/Storages/MergeTree/MergeTreePartition.cpp | 1 - 1 file changed, 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreePartition.cpp b/src/Storages/MergeTree/MergeTreePartition.cpp index 880a3aa181d..4a846f63b7c 100644 --- a/src/Storages/MergeTree/MergeTreePartition.cpp +++ b/src/Storages/MergeTree/MergeTreePartition.cpp @@ -87,7 +87,6 @@ String MergeTreePartition::getID(const Block & partition_key_sample) const return result; } - void MergeTreePartition::serializeText(const MergeTreeData & storage, WriteBuffer & out, const FormatSettings & format_settings) const { auto metadata_snapshot = storage.getInMemoryMetadataPtr(); From ebb9de1376d50e834b61b48cc2f4695513244ad9 Mon Sep 17 00:00:00 2001 From: alesapin Date: Fri, 11 Sep 2020 14:13:41 +0300 Subject: [PATCH 134/341] Supress strange warning --- src/Functions/negate.cpp | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/src/Functions/negate.cpp b/src/Functions/negate.cpp index 39ca434ea89..3101513648b 100644 --- a/src/Functions/negate.cpp +++ b/src/Functions/negate.cpp @@ -13,7 +13,14 @@ struct NegateImpl static inline NO_SANITIZE_UNDEFINED ResultType apply(A a) { - return -static_cast(a); +#if defined (__GNUC__) && __GNUC__ >= 10 + #pragma GCC diagnostic push + #pragma GCC diagnostic ignored "-Wvector-operation-performance" +#endif + return -(static_cast(a)); +#if defined (__GNUC__) && __GNUC__ >= 10 + #pragma GCC diagnostic pop +#endif } #if USE_EMBEDDED_COMPILER From 5ce0c21bbe3c08a0f5169bced9dcea208857c88a Mon Sep 17 00:00:00 2001 From: alesapin Date: Fri, 11 Sep 2020 14:24:42 +0300 Subject: [PATCH 135/341] Remove redundant change --- src/Functions/negate.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Functions/negate.cpp b/src/Functions/negate.cpp index 3101513648b..de3995927d3 100644 --- a/src/Functions/negate.cpp +++ b/src/Functions/negate.cpp @@ -17,7 +17,7 @@ struct NegateImpl 
#pragma GCC diagnostic push #pragma GCC diagnostic ignored "-Wvector-operation-performance" #endif - return -(static_cast(a)); + return -static_cast(a); #if defined (__GNUC__) && __GNUC__ >= 10 #pragma GCC diagnostic pop #endif From eb7e480d399788dae32dc83bd4b32dfdc6ec1aa3 Mon Sep 17 00:00:00 2001 From: Roman Bug Date: Fri, 11 Sep 2020 15:47:36 +0300 Subject: [PATCH 136/341] DOCSUP-2040: Translate PR to RU (#14551) * DOCSUP-2040: Update by PR#1127. * DOCSUP-2040: Update by PR#11088. * DOCSUP-2040: Update by PR#10923. * DOCSUP-2040: Minor fix. * Update docs/ru/sql-reference/functions/random-functions.md Co-authored-by: Ilya Yatsishin <2159081+qoega@users.noreply.github.com> * Update docs/ru/sql-reference/functions/type-conversion-functions.md Co-authored-by: Ilya Yatsishin <2159081+qoega@users.noreply.github.com> * Update translation. * Update docs/ru/sql-reference/functions/type-conversion-functions.md Co-authored-by: BayoNet * Update docs/ru/sql-reference/functions/random-functions.md Co-authored-by: BayoNet * Update docs/ru/sql-reference/functions/type-conversion-functions.md Co-authored-by: BayoNet * Update docs/ru/sql-reference/functions/type-conversion-functions.md Co-authored-by: BayoNet Co-authored-by: romanzhukov Co-authored-by: Ilya Yatsishin <2159081+qoega@users.noreply.github.com> Co-authored-by: BayoNet --- docs/ru/interfaces/formats.md | 20 +++- .../functions/random-functions.md | 46 ++++++++++ .../functions/type-conversion-functions.md | 91 +++++++++++++++++++ 3 files changed, 156 insertions(+), 1 deletion(-) diff --git a/docs/ru/interfaces/formats.md b/docs/ru/interfaces/formats.md index 054f75e8da8..04bca115974 100644 --- a/docs/ru/interfaces/formats.md +++ b/docs/ru/interfaces/formats.md @@ -28,6 +28,8 @@ ClickHouse может принимать (`INSERT`) и отдавать (`SELECT | [PrettySpace](#prettyspace) | ✗ | ✔ | | [Protobuf](#protobuf) | ✔ | ✔ | | [Parquet](#data-format-parquet) | ✔ | ✔ | +| [Arrow](#data-format-arrow) | ✔ | ✔ | +| [ArrowStream](#data-format-arrow-stream) | ✔ | ✔ | | [ORC](#data-format-orc) | ✔ | ✗ | | [RowBinary](#rowbinary) | ✔ | ✔ | | [RowBinaryWithNamesAndTypes](#rowbinarywithnamesandtypes) | ✔ | ✔ | @@ -947,6 +949,12 @@ ClickHouse пишет и читает сообщения `Protocol Buffers` в ## Avro {#data-format-avro} +[Apache Avro](https://avro.apache.org/) — это ориентированный на строки фреймворк для сериализации данных. Разработан в рамках проекта Apache Hadoop. + +В ClickHouse формат Avro поддерживает чтение и запись [файлов данных Avro](https://avro.apache.org/docs/current/spec.html#Object+Container+Files). + +[Логические типы Avro](https://avro.apache.org/docs/current/spec.html#Logical+Types) + ## AvroConfluent {#data-format-avro-confluent} Для формата `AvroConfluent` ClickHouse поддерживает декодирование сообщений `Avro` с одним объектом. Такие сообщения используются с [Kafka] (http://kafka.apache.org/) и реестром схем [Confluent](https://docs.confluent.io/current/schema-registry/index.html). @@ -996,7 +1004,7 @@ SELECT * FROM topic1_stream; ## Parquet {#data-format-parquet} -[Apache Parquet](http://parquet.apache.org/) — формат поколоночного хранения данных, который распространён в экосистеме Hadoop. Для формата `Parquet` ClickHouse поддерживает операции чтения и записи. +[Apache Parquet](https://parquet.apache.org/) — формат поколоночного хранения данных, который распространён в экосистеме Hadoop. Для формата `Parquet` ClickHouse поддерживает операции чтения и записи. 
### Соответствие типов данных {#sootvetstvie-tipov-dannykh} @@ -1042,6 +1050,16 @@ $ clickhouse-client --query="SELECT * FROM {some_table} FORMAT Parquet" > {some_ Для обмена данными с экосистемой Hadoop можно использовать движки таблиц [HDFS](../engines/table-engines/integrations/hdfs.md). +## Arrow {data-format-arrow} + +[Apache Arrow](https://arrow.apache.org/) поставляется с двумя встроенными поколоночнами форматами хранения. ClickHouse поддерживает операции чтения и записи для этих форматов. + +`Arrow` — это Apache Arrow's "file mode" формат. Он предназначен для произвольного доступа в памяти. + +## ArrowStream {data-format-arrow-stream} + +`ArrowStream` — это Apache Arrow's "stream mode" формат. Он предназначен для обработки потоков в памяти. + ## ORC {#data-format-orc} [Apache ORC](https://orc.apache.org/) - это column-oriented формат данных, распространённый в экосистеме Hadoop. Вы можете только вставлять данные этого формата в ClickHouse. diff --git a/docs/ru/sql-reference/functions/random-functions.md b/docs/ru/sql-reference/functions/random-functions.md index b425505b69d..4aaaef5cb5d 100644 --- a/docs/ru/sql-reference/functions/random-functions.md +++ b/docs/ru/sql-reference/functions/random-functions.md @@ -55,4 +55,50 @@ FROM numbers(3) └────────────┴────────────┴──────────────┴────────────────┴─────────────────┴──────────────────────┘ ``` +# Случайные функции для работы со строками {#random-functions-for-working-with-strings} + +## randomString {#random-string} + +## randomFixedString {#random-fixed-string} + +## randomPrintableASCII {#random-printable-ascii} + +## randomStringUTF8 {#random-string-utf8} + +## fuzzBits {#fuzzbits} + +**Синтаксис** + +``` sql +fuzzBits([s], [prob]) +``` +Инвертирует каждый бит `s` с вероятностью `prob`. + +**Параметры** + +- `s` — `String` or `FixedString` +- `prob` — constant `Float32/64` + +**Возвращаемое значение** + +Измененная случайным образом строка с тем же типом, что и `s`. + +**Пример** + +Запрос: + +``` sql +SELECT fuzzBits(materialize('abacaba'), 0.1) +FROM numbers(3) +``` + +Результат: + +``` text +┌─fuzzBits(materialize('abacaba'), 0.1)─┐ +│ abaaaja │ +│ a*cjab+ │ +│ aeca2A │ +└───────────────────────────────────────┘ + [Оригинальная статья](https://clickhouse.tech/docs/ru/query_language/functions/random_functions/) diff --git a/docs/ru/sql-reference/functions/type-conversion-functions.md b/docs/ru/sql-reference/functions/type-conversion-functions.md index 41ded78055c..c7d74a9d881 100644 --- a/docs/ru/sql-reference/functions/type-conversion-functions.md +++ b/docs/ru/sql-reference/functions/type-conversion-functions.md @@ -513,4 +513,95 @@ SELECT parseDateTimeBestEffort('10 20:19') - [toDate](#todate) - [toDateTime](#todatetime) +## toUnixTimestamp64Milli +## toUnixTimestamp64Micro +## toUnixTimestamp64Nano + +Преобразует значение `DateTime64` в значение `Int64` с фиксированной точностью менее одной секунды. +Входное значение округляется соответствующим образом вверх или вниз в зависимости от его точности. Обратите внимание, что возвращаемое значение - это временная метка в UTC, а не в часовом поясе `DateTime64`. + +**Синтаксис** + +``` sql +toUnixTimestamp64Milli(value) +``` + +**Параметры** + +- `value` — значение `DateTime64` с любой точностью. + +**Возвращаемое значение** + +- Значение `value`, преобразованное в тип данных `Int64`. 
+ +**Примеры** + +Запрос: + +``` sql +WITH toDateTime64('2019-09-16 19:20:12.345678910', 6) AS dt64 +SELECT toUnixTimestamp64Milli(dt64) +``` + +Ответ: + +``` text +┌─toUnixTimestamp64Milli(dt64)─┐ +│ 1568650812345 │ +└──────────────────────────────┘ +``` + +Запрос: + +``` sql +WITH toDateTime64('2019-09-16 19:20:12.345678910', 6) AS dt64 +SELECT toUnixTimestamp64Nano(dt64) +``` + +Ответ: + +``` text +┌─toUnixTimestamp64Nano(dt64)─┐ +│ 1568650812345678000 │ +└─────────────────────────────┘ +``` + +## fromUnixTimestamp64Milli +## fromUnixTimestamp64Micro +## fromUnixTimestamp64Nano + +Преобразует значение `Int64` в значение `DateTime64` с фиксированной точностью менее одной секунды и дополнительным часовым поясом. Входное значение округляется соответствующим образом вверх или вниз в зависимости от его точности. Обратите внимание, что входное значение обрабатывается как метка времени UTC, а не метка времени в заданном (или неявном) часовом поясе. + +**Синтаксис** + +``` sql +fromUnixTimestamp64Milli(value [, ti]) +``` + +**Параметры** + +- `value` — значение типы `Int64` с любой точностью. +- `timezone` — (не обязательный параметр) часовой пояс в формате `String` для возвращаемого результата. + +**Возвращаемое значение** + +- Значение `value`, преобразованное в тип данных `DateTime64`. + +**Пример** + +Запрос: + +``` sql +WITH CAST(1234567891011, 'Int64') AS i64 +SELECT fromUnixTimestamp64Milli(i64, 'UTC') +``` + +Ответ: + +``` text +┌─fromUnixTimestamp64Milli(i64, 'UTC')─┐ +│ 2009-02-13 23:31:31.011 │ +└──────────────────────────────────────┘ +``` + [Оригинальная статья](https://clickhouse.tech/docs/ru/query_language/functions/type_conversion_functions/) From a64331d79f04bb9321383269150fe8302289e9b2 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Fri, 11 Sep 2020 16:09:26 +0300 Subject: [PATCH 137/341] fix syncing of WAL --- src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp | 7 +++++++ src/Storages/MergeTree/MergeTreeWriteAheadLog.h | 2 ++ 2 files changed, 9 insertions(+) diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp index bc6738a8321..35fadb999b4 100644 --- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp +++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp @@ -37,6 +37,13 @@ MergeTreeWriteAheadLog::MergeTreeWriteAheadLog( }); } +MergeTreeWriteAheadLog::~MergeTreeWriteAheadLog() +{ + std::unique_lock lock(write_mutex); + if (sync_scheduled) + sync_cv.wait(lock, [this] { return !sync_scheduled; }); +} + void MergeTreeWriteAheadLog::init() { out = disk->writeFile(path, DBMS_DEFAULT_BUFFER_SIZE, WriteMode::Append); diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.h b/src/Storages/MergeTree/MergeTreeWriteAheadLog.h index c5675eac696..77c7c7e11e7 100644 --- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.h +++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.h @@ -35,6 +35,8 @@ public: MergeTreeWriteAheadLog(MergeTreeData & storage_, const DiskPtr & disk_, const String & name = DEFAULT_WAL_FILE_NAME); + ~MergeTreeWriteAheadLog(); + void addPart(const Block & block, const String & part_name); void dropPart(const String & part_name); std::vector restore(const StorageMetadataPtr & metadata_snapshot); From 6dd764bcfe5b28d3ccb89ca950558bd82c911847 Mon Sep 17 00:00:00 2001 From: Artem Zuikov Date: Fri, 11 Sep 2020 18:12:08 +0300 Subject: [PATCH 138/341] FunctionBinaryArithmetic refactoring (#14712) --- src/Functions/FunctionBinaryArithmetic.h | 165 ++++++++++------------- src/Functions/divide.cpp | 1 - 
src/Functions/minus.cpp | 1 - src/Functions/multiply.cpp | 1 - src/Functions/plus.cpp | 2 +- 5 files changed, 72 insertions(+), 98 deletions(-) diff --git a/src/Functions/FunctionBinaryArithmetic.h b/src/Functions/FunctionBinaryArithmetic.h index 15b6ea6ca5d..ca0cc876035 100644 --- a/src/Functions/FunctionBinaryArithmetic.h +++ b/src/Functions/FunctionBinaryArithmetic.h @@ -561,6 +561,8 @@ public: template