#pragma once #include #include #include #include #include #include #include namespace DB { class TableJoin; class MergeJoinCursor; struct MergeJoinEqualRange; class IVolume; using VolumePtr = std::shared_ptr; struct SortedBlocksWriter { using TmpFilePtr = std::unique_ptr; using SortedFiles = std::vector; struct Blocks { BlocksList blocks; size_t row_count = 0; size_t bytes = 0; bool empty() const { return blocks.empty(); } void insert(Block && block) { countBlockSize(block); blocks.emplace_back(std::move(block)); } void countBlockSize(const Block & block) { row_count += block.rows(); bytes += block.bytes(); } void clear() { blocks.clear(); row_count = 0; bytes = 0; } }; struct PremergedFiles { SortedFiles files; BlockInputStreams streams; }; static constexpr const size_t num_streams = 2; std::mutex insert_mutex; std::condition_variable flush_condvar; const SizeLimits & size_limits; VolumePtr volume; Block sample_block; const SortDescription & sort_description; Blocks inserted_blocks; const size_t rows_in_block; const size_t num_files_for_merge; const String & codec; SortedFiles sorted_files; size_t row_count_in_flush = 0; size_t bytes_in_flush = 0; size_t flush_number = 0; size_t flush_inflight = 0; SortedBlocksWriter(const SizeLimits & size_limits_, VolumePtr volume_, const Block & sample_block_, const SortDescription & description, size_t rows_in_block_, size_t num_files_to_merge_, const String & codec_) : size_limits(size_limits_) , volume(volume_) , sample_block(sample_block_) , sort_description(description) , rows_in_block(rows_in_block_) , num_files_for_merge(num_files_to_merge_) , codec(codec_) {} void addBlocks(const Blocks & blocks) { sorted_files.emplace_back(flush(blocks.blocks)); } String getPath() const; BlockInputStreamPtr streamFromFile(const TmpFilePtr & file) const; void insert(Block && block); TmpFilePtr flush(const BlocksList & blocks) const; PremergedFiles premerge(); SortedFiles finishMerge(std::function callback = [](const Block &){}); }; 
/// Buffer of blocks with an associated byte budget and sort description.
/// exchange() and mergeBlocks() are only declared here; their behaviour is
/// defined in the implementation file.
class SortedBlocksBuffer
{
public:
    /// @param sort_description_  Bound as a reference (not copied); it must outlive this buffer.
    /// @param max_bytes_         Stored in max_bytes; how it is enforced is not visible in this header.
    SortedBlocksBuffer(const SortDescription & sort_description_, size_t max_bytes_)
        : max_bytes(max_bytes_)
        , sort_description(sort_description_)
    {
    }

    /// Hands a block to the buffer and returns a block.
    /// NOTE(review): the exact exchange semantics live outside this header — confirm there.
    Block exchange(Block && block);

private:
    /// NOTE(review): presumably guards the state below; usage is not visible here — confirm.
    std::mutex mutex;
    size_t max_bytes;
    /// Starts at zero for a freshly constructed buffer.
    size_t current_bytes = 0;
    Blocks buffer;
    const SortDescription & sort_description;

    /// Consumes a set of blocks and returns a single block.
    Block mergeBlocks(Blocks && blocks) const;
};

} // namespace DB