ClickHouse/src/Storages/MergeTree/MergedBlockOutputStream.cpp

#include <Storages/MergeTree/MergedBlockOutputStream.h>
#include <Interpreters/Context.h>
#include <Poco/File.h>


namespace DB
{

/// Error codes used by this translation unit. They are only declared here
/// (`extern`); the definitions live elsewhere in the project.
namespace ErrorCodes
{
    /// Thrown by MergedBlockOutputStream::writeSuffix.
    extern const int NOT_IMPLEMENTED;
    /// Thrown by writeSuffixAndFinalizePart when the minmax index of a non-empty part is not initialized.
    extern const int LOGICAL_ERROR;
}


/// Convenience constructor: delegates to the eight-argument constructor, supplying
/// an empty column-to-size map and taking the AIO threshold from the
/// `min_bytes_to_use_direct_io` setting of the storage's global context.
MergedBlockOutputStream::MergedBlockOutputStream(
    const MergeTreeDataPartPtr & data_part,
    const StorageMetadataPtr & metadata_snapshot_,
    const NamesAndTypesList & columns_list_,
    const MergeTreeIndices & skip_indices,
    CompressionCodecPtr default_codec,
    bool blocks_are_granules_size)
    : MergedBlockOutputStream(
        data_part,
        metadata_snapshot_,
        columns_list_,
        skip_indices,
        default_codec,
        /// merged_column_to_size: empty, so the delegated constructor adds nothing to the size estimate.
        {},
        /// aio_threshold
        data_part->storage.global_context.getSettings().min_bytes_to_use_direct_io,
        blocks_are_granules_size)
{
}

/** Full constructor.
  *
  * Builds the writer settings, optionally accumulates an estimated size from
  * merged_column_to_size, creates the part directory on the volume's disk and
  * finally obtains the writer from the data part and initializes its primary
  * and skip indices.
  *
  * merged_column_to_size - per-column sizes; only consulted when aio_threshold is
  *     non-zero and the map is non-empty.
  * aio_threshold - forwarded to the writer settings; zero disables the size estimate.
  */
MergedBlockOutputStream::MergedBlockOutputStream(
    const MergeTreeDataPartPtr & data_part,
    const StorageMetadataPtr & metadata_snapshot_,
    const NamesAndTypesList & columns_list_,
    const MergeTreeIndices & skip_indices,
    CompressionCodecPtr default_codec,
    const MergeTreeData::DataPart::ColumnToSize & merged_column_to_size,
    size_t aio_threshold,
    bool blocks_are_granules_size)
    : IMergedBlockOutputStream(data_part, metadata_snapshot_)
    , columns_list(columns_list_)
{
    MergeTreeWriterSettings writer_settings(
        data_part->storage.global_context.getSettings(),
        data_part->storage.canUseAdaptiveGranularity(),
        aio_threshold,
        blocks_are_granules_size);

    /// The estimate is the sum of the known sizes of the columns this stream writes.
    const bool should_estimate_size = aio_threshold > 0 && !merged_column_to_size.empty();
    if (should_estimate_size)
    {
        for (const auto & name_and_type : columns_list)
        {
            const auto known_size = merged_column_to_size.find(name_and_type.name);
            if (known_size == merged_column_to_size.end())
                continue;   /// No size recorded for this column.

            writer_settings.estimated_size += known_size->second;
        }
    }

    /// The part directory must exist before the writer is created.
    volume->getDisk()->createDirectories(part_path);

    writer = data_part->getWriter(columns_list, skip_indices, default_codec, writer_settings);
    writer->initPrimaryIndex();
    writer->initSkipIndices();
}

/// Writes a block whose data is already sorted: forwards to writeImpl with no permutation (nullptr).
void MergedBlockOutputStream::write(const Block & block)
{
    writeImpl(block, nullptr);
}

/** Writes a block whose data is not sorted, given a pre-calculated permutation that puts the rows in sorted order.
  * This saves RAM, because the source block and a sorted copy of it do not have to be kept in memory at the same time.
  * The block and the permutation are forwarded to writeImpl unchanged.
  */
void MergedBlockOutputStream::writeWithPermutation(const Block & block, const IColumn::Permutation * permutation)
{
    writeImpl(block, permutation);
}

/// Not supported by this stream: always throws an Exception with code NOT_IMPLEMENTED.
/// This class provides writeSuffixAndFinalizePart for completing a part.
void MergedBlockOutputStream::writeSuffix()
{
    throw Exception("Method writeSuffix is not supported by MergedBlockOutputStream", ErrorCodes::NOT_IMPLEMENTED);
}

/** Completes writing of the part and fills in the in-memory description of new_part.
  *
  * Steps, in order:
  *  - finish data, primary index and skip indices serialization in the writer;
  *  - for storages with custom partitioning, or for compact parts: store the partition,
  *    the minmax index (if initialized) and count.txt;
  *  - write ttl.txt if the part has TTL infos;
  *  - call removeEmptyColumnsFromPart;
  *  - write columns.txt and checksums.txt;
  *  - assign columns, rows count, modification time, index, checksums, size on disk
  *    and index granularity to new_part.
  *
  * new_part - the part being finalized.
  * total_columns_list - if not null, used as the column list of the part instead of the
  *     list this stream was constructed with.
  * additional_column_checksums - if not null, its contents are moved out and become the
  *     initial set of checksums.
  *
  * Throws an Exception with code LOGICAL_ERROR if, inside the partition/minmax branch,
  * the minmax index is not initialized although rows have been written.
  */
void MergedBlockOutputStream::writeSuffixAndFinalizePart(
        MergeTreeData::MutableDataPartPtr & new_part,
        const NamesAndTypesList * total_columns_list,
        MergeTreeData::DataPart::Checksums * additional_column_checksums)
{
    /// Checksums of every file of the part are accumulated here.
    MergeTreeData::DataPart::Checksums part_checksums;
    if (additional_column_checksums)
        part_checksums = std::move(*additional_column_checksums);

    /// Let the writer flush everything it still holds.
    writer->finishDataSerialization(part_checksums);
    writer->finishPrimaryIndexSerialization(part_checksums);
    writer->finishSkipIndicesSerialization(part_checksums);

    NamesAndTypesList part_columns = total_columns_list ? *total_columns_list : columns_list;

    const bool has_custom_partitioning = storage.format_version >= MERGE_TREE_DATA_MIN_FORMAT_VERSION_WITH_CUSTOM_PARTITIONING;
    if (has_custom_partitioning || isCompactPart(new_part))
    {
        new_part->partition.store(storage, volume->getDisk(), part_path, part_checksums);

        if (!new_part->minmax_idx.initialized)
        {
            /// An uninitialized minmax index is tolerated only when no rows were written.
            if (rows_count)
                throw Exception("MinMax index was not initialized for new non-empty part " + new_part->name
                    + ". It is a bug.", ErrorCodes::LOGICAL_ERROR);
        }
        else
        {
            new_part->minmax_idx.store(storage, volume->getDisk(), part_path, part_checksums);
        }

        /// Write the number of rows and record the size and hash of that file.
        auto count_file = volume->getDisk()->writeFile(part_path + "count.txt", 4096);
        HashingWriteBuffer hashing_count_file(*count_file);
        writeIntText(rows_count, hashing_count_file);
        hashing_count_file.next();

        auto & count_checksum = part_checksums.files["count.txt"];
        count_checksum.file_size = hashing_count_file.count();
        count_checksum.file_hash = hashing_count_file.getHash();
    }

    if (!new_part->ttl_infos.empty())
    {
        /// Write a file with ttl infos in json format.
        auto ttl_file = volume->getDisk()->writeFile(part_path + "ttl.txt", 4096);
        HashingWriteBuffer hashing_ttl_file(*ttl_file);
        new_part->ttl_infos.write(hashing_ttl_file);

        auto & ttl_checksum = part_checksums.files["ttl.txt"];
        ttl_checksum.file_size = hashing_ttl_file.count();
        ttl_checksum.file_hash = hashing_ttl_file.getHash();
    }

    removeEmptyColumnsFromPart(new_part, part_columns, part_checksums);

    {
        /// Description of the columns. The buffer lives only inside this scope.
        auto columns_file = volume->getDisk()->writeFile(part_path + "columns.txt", 4096);
        part_columns.writeText(*columns_file);
    }

    {
        /// Checksums are written last, after all other files have been accounted for.
        auto checksums_file = volume->getDisk()->writeFile(part_path + "checksums.txt", 4096);
        part_checksums.write(*checksums_file);
    }

    /// Publish the results into the in-memory part.
    new_part->setColumns(part_columns);
    new_part->rows_count = rows_count;
    new_part->modification_time = time(nullptr);
    new_part->index = writer->releaseIndexColumns();
    new_part->checksums = part_checksums;
    new_part->setBytesOnDisk(part_checksums.getTotalSizeOnDisk());
    new_part->index_granularity = writer->getIndexGranularity();
    new_part->calculateColumnsSizesOnDisk();
}

/** Common implementation of write and writeWithPermutation.
  *
  * Validates the block, skips it if it has no rows, extracts the primary key columns and
  * the columns used by secondary indices (applying the permutation, if one is given),
  * hands everything to the writer and adds the number of rows to rows_count.
  *
  * permutation - may be nullptr; it is passed through to getBlockAndPermute and the writer.
  */
void MergedBlockOutputStream::writeImpl(const Block & block, const IColumn::Permutation * permutation)
{
    block.checkNumberOfRows();

    const size_t rows_in_block = block.rows();
    if (rows_in_block == 0)
        return;

    /// Several indices may refer to the same column; gather every name only once.
    std::unordered_set<String> unique_index_columns;
    for (const auto & index : storage.getSecondaryIndices())
        for (const auto & column_name : index.column_names)
            unique_index_columns.insert(column_name);

    Names index_column_names(unique_index_columns.begin(), unique_index_columns.end());

    Block pk_block = getBlockAndPermute(block, storage.getPrimaryKeyColumns(), permutation);
    Block indices_block = getBlockAndPermute(block, index_column_names, permutation);

    writer->write(block, permutation, pk_block, indices_block);
    writer->calculateAndSerializeSkipIndices(indices_block, rows_in_block);
    writer->calculateAndSerializePrimaryIndex(pk_block, rows_in_block);
    writer->next();

    rows_count += rows_in_block;
}

}
Moved headers and sources to same place [#CLICKHOUSE-3]. 2017-04-01 09:19:00 +00:00			`#include <Storages/MergeTree/MergedBlockOutputStream.h>`
Forward declaration for Context as much as possible. Now after changing Context.h 488 modules will be recompiled instead of 582. 2020-05-20 20:16:32 +00:00			`#include <Interpreters/Context.h>`
Less dependencies 2 (#378) * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. * Less dependencies [#CLICKHOUSE-2]. 2017-01-21 04:24:28 +00:00			`#include <Poco/File.h>`

dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00
			`namespace DB`
			`{`

Fixed insufficient type checking in hasAll, hasAny functions 2019-03-14 23:10:51 +00:00			`namespace ErrorCodes`
			`{`
Fixed ErrorCodes, part 3 2020-02-25 18:20:08 +00:00			`extern const int NOT_IMPLEMENTED;`
			`extern const int LOGICAL_ERROR;`
Fixed insufficient type checking in hasAll, hasAny functions 2019-03-14 23:10:51 +00:00			`}`

dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00
			`MergedBlockOutputStream::MergedBlockOutputStream(`
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`const MergeTreeDataPartPtr & data_part,`
Buildable getSampleBlock in StorageInMemoryMetadata 2020-06-16 15:51:29 +00:00			`const StorageMetadataPtr & metadata_snapshot_,`
Revert "Removed questionable code (2) [#CLICKHOUSE-2]." This reverts commit fcabe8b8886720da24208b12e176f0d09f408698. 2017-12-25 21:57:29 +00:00			`const NamesAndTypesList & columns_list_,`
fix 'ALTER CLEAR INDEX/COLUMN' queries with compact parts 2020-04-10 13:36:51 +00:00			`const MergeTreeIndices & skip_indices,`
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`CompressionCodecPtr default_codec,`
			`bool blocks_are_granules_size)`
better initialization of MergedBlockOutputStream 2020-02-04 13:34:57 +00:00			`: MergedBlockOutputStream(`
Buildable getSampleBlock in StorageInMemoryMetadata 2020-06-16 15:51:29 +00:00			`data_part,`
			`metadata_snapshot_,`
			`columns_list_,`
			`skip_indices,`
			`default_codec,`
			`{},`
better initialization of MergedBlockOutputStream 2020-02-04 13:34:57 +00:00			`data_part->storage.global_context.getSettings().min_bytes_to_use_direct_io,`
			`blocks_are_granules_size)`
polymorphic parts (development) cleanup 2019-12-18 16:41:11 +00:00			`{`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`}`

			`MergedBlockOutputStream::MergedBlockOutputStream(`
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`const MergeTreeDataPartPtr & data_part,`
Buildable getSampleBlock in StorageInMemoryMetadata 2020-06-16 15:51:29 +00:00			`const StorageMetadataPtr & metadata_snapshot_,`
Revert "Removed questionable code (2) [#CLICKHOUSE-2]." This reverts commit fcabe8b8886720da24208b12e176f0d09f408698. 2017-12-25 21:57:29 +00:00			`const NamesAndTypesList & columns_list_,`
fix 'ALTER CLEAR INDEX/COLUMN' queries with compact parts 2020-04-10 13:36:51 +00:00			`const MergeTreeIndices & skip_indices,`
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`CompressionCodecPtr default_codec,`
polymorphic parts (development) 2019-11-05 11:53:22 +00:00			`const MergeTreeData::DataPart::ColumnToSize & merged_column_to_size,`
			`size_t aio_threshold,`
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`bool blocks_are_granules_size)`
Buildable getSampleBlock in StorageInMemoryMetadata 2020-06-16 15:51:29 +00:00			`: IMergedBlockOutputStream(data_part, metadata_snapshot_)`
fix 2019-07-28 11:10:35 +00:00			`, columns_list(columns_list_)`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`{`
polymorphic parts (development) cleanup 2019-12-18 15:54:45 +00:00			`MergeTreeWriterSettings writer_settings(data_part->storage.global_context.getSettings(),`
better initialization of MergedBlockOutputStream 2020-02-04 13:34:57 +00:00			`data_part->storage.canUseAdaptiveGranularity(), aio_threshold, blocks_are_granules_size);`
polymorphic parts (development) 2019-11-05 11:53:22 +00:00
			`if (aio_threshold > 0 && !merged_column_to_size.empty())`
			`{`
polymorphic parts (development) alter update 2019-12-18 13:09:58 +00:00			`for (const auto & column : columns_list)`
polymorphic parts (development) 2019-11-05 11:53:22 +00:00			`{`
polymorphic parts (development) alter update 2019-12-18 13:09:58 +00:00			`auto size_it = merged_column_to_size.find(column.name);`
			`if (size_it != merged_column_to_size.end())`
			`writer_settings.estimated_size += size_it->second;`
polymorphic parts (development) 2019-11-05 11:53:22 +00:00			`}`
			`}`

VolumePtr instead of DiskPtr in IMergedBlockOutputStream and inherited classes 2020-05-11 17:20:26 +00:00			`volume->getDisk()->createDirectories(part_path);`
better initialization of MergedBlockOutputStream 2020-02-04 13:34:57 +00:00
fix 'ALTER CLEAR INDEX/COLUMN' queries with compact parts 2020-04-10 13:36:51 +00:00			`writer = data_part->getWriter(columns_list, skip_indices, default_codec, writer_settings);`
better initialization of MergedBlockOutputStream 2020-02-04 13:34:57 +00:00			`writer->initPrimaryIndex();`
			`writer->initSkipIndices();`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`}`

Fixed style a bit [#CLICKHOUSE-2] 2018-05-07 02:01:11 +00:00			`/// If data is pre-sorted.`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`void MergedBlockOutputStream::write(const Block & block)`
			`{`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`writeImpl(block, nullptr);`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`}`

translate comments 2017-03-12 19:18:07 +00:00			`/** If the data is not sorted, but we pre-calculated the permutation, after which they will be sorted.`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`* This method is used to save RAM, since you do not need to keep two blocks at once - the source and the sorted.`
			`*/`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`void MergedBlockOutputStream::writeWithPermutation(const Block & block, const IColumn::Permutation * permutation)`
			`{`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`writeImpl(block, permutation);`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`}`

			`void MergedBlockOutputStream::writeSuffix()`
			`{`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`throw Exception("Method writeSuffix is not supported by MergedBlockOutputStream", ErrorCodes::NOT_IMPLEMENTED);`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`}`

serialize partition and minmax index values [#CLICKHOUSE-3000] 2017-08-30 19:03:19 +00:00			`void MergedBlockOutputStream::writeSuffixAndFinalizePart(`
			`MergeTreeData::MutableDataPartPtr & new_part,`
clang-tidy, part 20 2020-03-09 02:55:28 +00:00			`const NamesAndTypesList * total_columns_list,`
serialize partition and minmax index values [#CLICKHOUSE-3000] 2017-08-30 19:03:19 +00:00			`MergeTreeData::DataPart::Checksums * additional_column_checksums)`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`{`
polymorphic parts (development) 2019-10-21 17:23:06 +00:00			`/// Finish write and get checksums.`
			`MergeTreeData::DataPart::Checksums checksums;`

polymorphic parts (development) 2019-10-28 11:00:29 +00:00			`if (additional_column_checksums)`
			`checksums = std::move(*additional_column_checksums);`

Added pre and post serialization for IDataType BinaryBulkWithMultipleStreams. Supported dictionary serialization format with single global dictionary (limited wit max_dictionary_size) and additional keys which are stored per granule. Changed IDataType::enumerateStream interface. Added (de)serialization params for binary bulk with multiple stream (de)serialization. Changed IColumn::index interface. 2018-06-07 18:14:37 +00:00			`/// Finish columns serialization.`
polymorphic parts (development) 2019-11-18 15:18:50 +00:00			`writer->finishDataSerialization(checksums);`
			`writer->finishPrimaryIndexSerialization(checksums);`
polymorphic parts (development) 2019-11-05 11:53:22 +00:00			`writer->finishSkipIndicesSerialization(checksums);`
Add ability to write final mark for MergeTree engines family (#5624) Add the ability to write final mark to MergeTree engines family. 2019-06-18 12:54:27 +00:00
Get rid of removeEmptyColumnsFromPart method based on alterDataPart. 2020-03-13 15:09:55 +00:00			`NamesAndTypesList part_columns;`
clang-tidy, part 20 2020-03-09 02:55:28 +00:00			`if (!total_columns_list)`
Get rid of removeEmptyColumnsFromPart method based on alterDataPart. 2020-03-13 15:09:55 +00:00			`part_columns = columns_list;`
			`else`
			`part_columns = *total_columns_list;`
serialize partition and minmax index values [#CLICKHOUSE-3000] 2017-08-30 19:03:19 +00:00
fix tests 2020-01-22 14:10:35 +00:00			`if (storage.format_version >= MERGE_TREE_DATA_MIN_FORMAT_VERSION_WITH_CUSTOM_PARTITIONING \|\| isCompactPart(new_part))`
fix backward compatibility for new part format: [#CLICKHOUSE-3000] * do not write out partition and minmax index files for old MergeTreeData format * download the part from another replica if there are missing or extra files 2017-10-19 18:20:41 +00:00			`{`
VolumePtr instead of DiskPtr in IMergedBlockOutputStream and inherited classes 2020-05-11 17:20:26 +00:00			`new_part->partition.store(storage, volume->getDisk(), part_path, checksums);`
support empty parts [#CLICKHOUSE-3747] 2018-05-23 19:34:37 +00:00			`if (new_part->minmax_idx.initialized)`
VolumePtr instead of DiskPtr in IMergedBlockOutputStream and inherited classes 2020-05-11 17:20:26 +00:00			`new_part->minmax_idx.store(storage, volume->getDisk(), part_path, checksums);`
add assert that MinMax index is correctly initialized [#CLICKHOUSE-3879] 2018-08-06 16:42:43 +00:00			`else if (rows_count)`
Update MergedBlockOutputStream.cpp 2018-08-06 16:53:34 +00:00			`throw Exception("MinMax index was not initialized for new non-empty part " + new_part->name`
add assert that MinMax index is correctly initialized [#CLICKHOUSE-3879] 2018-08-06 16:42:43 +00:00			`+ ". It is a bug.", ErrorCodes::LOGICAL_ERROR);`
store rows count for part on disk to allow tables without fixed size columns [#CLICKHOUSE-3000] 2017-10-24 14:11:53 +00:00
VolumePtr instead of DiskPtr in IMergedBlockOutputStream and inherited classes 2020-05-11 17:20:26 +00:00			`auto count_out = volume->getDisk()->writeFile(part_path + "count.txt", 4096);`
Storage MergeTree initial support for S3. 2020-02-27 16:47:40 +00:00			`HashingWriteBuffer count_out_hashing(*count_out);`
store rows count for part on disk to allow tables without fixed size columns [#CLICKHOUSE-3000] 2017-10-24 14:11:53 +00:00			`writeIntText(rows_count, count_out_hashing);`
			`count_out_hashing.next();`
			`checksums.files["count.txt"].file_size = count_out_hashing.count();`
			`checksums.files["count.txt"].file_hash = count_out_hashing.getHash();`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`}`

Minor fix. 2019-10-17 18:55:07 +00:00			`if (!new_part->ttl_infos.empty())`
TTL for columns and tables (#4212) Add TTL for columns and tables. 2019-04-15 09:30:45 +00:00			`{`
			`/// Write a file with ttl infos in json format.`
VolumePtr instead of DiskPtr in IMergedBlockOutputStream and inherited classes 2020-05-11 17:20:26 +00:00			`auto out = volume->getDisk()->writeFile(part_path + "ttl.txt", 4096);`
Storage MergeTree initial support for S3. 2020-02-27 16:47:40 +00:00			`HashingWriteBuffer out_hashing(*out);`
TTL for columns and tables (#4212) Add TTL for columns and tables. 2019-04-15 09:30:45 +00:00			`new_part->ttl_infos.write(out_hashing);`
			`checksums.files["ttl.txt"].file_size = out_hashing.count();`
			`checksums.files["ttl.txt"].file_hash = out_hashing.getHash();`
			`}`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00
Get rid of removeEmptyColumnsFromPart method based on alterDataPart. 2020-03-13 15:09:55 +00:00			`removeEmptyColumnsFromPart(new_part, part_columns, checksums);`

Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`{`
			`/// Write a file with a description of columns.`
VolumePtr instead of DiskPtr in IMergedBlockOutputStream and inherited classes 2020-05-11 17:20:26 +00:00			`auto out = volume->getDisk()->writeFile(part_path + "columns.txt", 4096);`
Get rid of removeEmptyColumnsFromPart method based on alterDataPart. 2020-03-13 15:09:55 +00:00			`part_columns.writeText(*out);`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`}`

			`{`
			`/// Write file with checksums.`
VolumePtr instead of DiskPtr in IMergedBlockOutputStream and inherited classes 2020-05-11 17:20:26 +00:00			`auto out = volume->getDisk()->writeFile(part_path + "checksums.txt", 4096);`
Storage MergeTree initial support for S3. 2020-02-27 16:47:40 +00:00			`checksums.write(*out);`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`}`

Get rid of removeEmptyColumnsFromPart method based on alterDataPart. 2020-03-13 15:09:55 +00:00			`new_part->setColumns(part_columns);`
store rows count for part on disk to allow tables without fixed size columns [#CLICKHOUSE-3000] 2017-10-24 14:11:53 +00:00			`new_part->rows_count = rows_count;`
serialize partition and minmax index values [#CLICKHOUSE-3000] 2017-08-30 19:03:19 +00:00			`new_part->modification_time = time(nullptr);`
polymorphic parts (development) 2019-11-18 15:18:50 +00:00			`new_part->index = writer->releaseIndexColumns();`
serialize partition and minmax index values [#CLICKHOUSE-3000] 2017-08-30 19:03:19 +00:00			`new_part->checksums = checksums;`
Remove atomic from bytes_size 2020-03-23 13:32:02 +00:00			`new_part->setBytesOnDisk(checksums.getTotalSizeOnDisk());`
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`new_part->index_granularity = writer->getIndexGranularity();`
Better size calculation 2020-03-23 12:19:43 +00:00			`new_part->calculateColumnsSizesOnDisk();`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`}`

			`void MergedBlockOutputStream::writeImpl(const Block & block, const IColumn::Permutation * permutation)`
			`{`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`block.checkNumberOfRows();`
			`size_t rows = block.rows();`
Deep debugging 2018-12-04 14:44:42 +00:00			`if (!rows)`
			`return;`
Compilable code! 2018-11-30 15:36:10 +00:00
better writer for compact parts 2019-12-27 21:17:53 +00:00			`std::unordered_set<String> skip_indexes_column_names_set;`
Rename to methods 2020-06-01 11:29:11 +00:00			`for (const auto & index : storage.getSecondaryIndices())`
I'm able to build it 2020-05-28 12:37:05 +00:00			`std::copy(index.column_names.cbegin(), index.column_names.cend(),`
fix 2019-02-14 16:59:26 +00:00			`std::inserter(skip_indexes_column_names_set, skip_indexes_column_names_set.end()));`
			`Names skip_indexes_column_names(skip_indexes_column_names_set.begin(), skip_indexes_column_names_set.end());`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00
Better 2020-05-21 19:46:03 +00:00			`Block primary_key_block = getBlockAndPermute(block, storage.getPrimaryKeyColumns(), permutation);`
polymorphic parts (development) alter 2019-12-09 21:21:17 +00:00			`Block skip_indexes_block = getBlockAndPermute(block, skip_indexes_column_names, permutation);`
Data Skipping Indices (#4143) * made index parser * added index parsing * some fixes * added index interface and factory * fixed compilation * ptrs * added indexParts * indextypes * index condition * IndexCondition * added indexes in selectexecutor * fix * changed comment * fix * added granularity * comments * fix * fix * added writing indexes * removed indexpart class * fix * added setSkipIndexes * add rw for MergeTreeIndexes * fixes * upd error * fix * fix * reading * test index * fixed nullptr error * fixed * fix * unique names * asts -> exprlist * minmax index * fix * fixed select * fixed merging * fixed mutation * working minmax * removed test index * fixed style * added indexes to checkDataPart * added tests for minmax index * fixed constructor * fix style * fixed includes * fixed setSkipIndexes * added indexes meta to zookeeper * added parsing * removed throw * alter cmds parse * fix * added alter * fix * alters fix * fix alters * fix "after" * fixed alter * alter fix + test * fixes * upd setSkipIndexes * fixed alter bug with drop all indices * fix metadata editing * new test and repl fix * rm test files * fixed repl alter * fix * fix * indices * MTReadStream * upd test for bug * fix * added useful parsers and ast classes * fix * fix comments * replaced columns * fix * fixed parsing * fixed printing * fix err * basic IndicesDescription * go to IndicesDescr * moved indices * go to indicesDescr * fix test minmax_index* * fixed MT alter * fixed bug with replMT indices storing in zk * rename * refactoring * docs ru * docs ru * docs en * refactor * rename tests * fix docs * refactoring * fix * fix * fix * fixed style * unique idx * unique * fix * better minmax calculation * upd * added getBlock * unique_condition * added termForAST * unique * fixed not * uniqueCondition::mayBeTrueOnGranule * fix * fixed bug with double column * is always true * fix * key set * spaces * test * tests * fix * unique * fix * fix * fixed bug with duplicate column * removed unused data 
* fix * fixes * __bitSwapLastTwo * fix 2019-02-05 14:50:25 +00:00
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`writer->write(block, permutation, primary_key_block, skip_indexes_block);`
polymorphic parts (development) 2019-11-05 11:53:22 +00:00			`writer->calculateAndSerializeSkipIndices(skip_indexes_block, rows);`
polymorphic parts (development) 2019-11-07 11:11:38 +00:00			`writer->calculateAndSerializePrimaryIndex(primary_key_block, rows);`
polymorphic parts (development) 2019-11-05 11:53:22 +00:00			`writer->next();`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00
store rows count for part on disk to allow tables without fixed size columns [#CLICKHOUSE-3000] 2017-10-24 14:11:53 +00:00			`rows_count += rows;`
dbms: NULL support for MergeTree [#METR-19266] 2016-07-21 16:22:24 +00:00			`}`

			`}`