#pragma once #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include namespace CurrentMetrics { extern const Metric Merge; } namespace DB { struct MergeInfo { std::string database; std::string table; std::string result_part_name; std::string result_part_path; Array source_part_names; Array source_part_paths; std::string partition_id; bool is_mutation; Float64 elapsed; Float64 progress; UInt64 num_parts; UInt64 total_size_bytes_compressed; UInt64 total_size_marks; UInt64 total_rows_count; UInt64 bytes_read_uncompressed; UInt64 bytes_written_uncompressed; UInt64 rows_read; UInt64 rows_written; UInt64 columns_written; UInt64 memory_usage; UInt64 thread_id; std::string merge_type; std::string merge_algorithm; }; struct FutureMergedMutatedPart; using FutureMergedMutatedPartPtr = std::shared_ptr; /** * Since merge is executed with multiple threads, this class * switches the parent MemoryTracker to account all the memory used. */ class MemoryTrackerThreadSwitcher : boost::noncopyable { public: explicit MemoryTrackerThreadSwitcher(MemoryTracker * memory_tracker_ptr, UInt64 untracked_memory_limit); ~MemoryTrackerThreadSwitcher(); private: MemoryTracker * background_thread_memory_tracker; MemoryTracker * background_thread_memory_tracker_prev_parent = nullptr; UInt64 prev_untracked_memory_limit; UInt64 prev_untracked_memory; }; using MemoryTrackerThreadSwitcherPtr = std::unique_ptr; struct MergeListElement : boost::noncopyable { const StorageID table_id; std::string partition_id; const std::string result_part_name; const std::string result_part_path; MergeTreePartInfo result_part_info; bool is_mutation{}; UInt64 num_parts{}; Names source_part_names; Names source_part_paths; Int64 source_data_version{}; Stopwatch watch; std::atomic progress{}; std::atomic is_cancelled{}; UInt64 total_size_bytes_compressed{}; UInt64 total_size_marks{}; UInt64 total_rows_count{}; std::atomic bytes_read_uncompressed{}; std::atomic bytes_written_uncompressed{}; /// In case of Vertical algorithm they are actual only for primary key columns std::atomic rows_read{}; std::atomic rows_written{}; /// Updated only for Vertical algorithm std::atomic columns_written{}; MemoryTracker memory_tracker{VariableContext::Process}; UInt64 max_untracked_memory; UInt64 thread_id; MergeType merge_type; /// Detected after merge already started std::atomic merge_algorithm; MergeListElement( const StorageID & table_id_, FutureMergedMutatedPartPtr future_part, UInt64 memory_profiler_step, UInt64 memory_profiler_sample_probability, UInt64 max_untracked_memory_); MergeInfo getInfo() const; MergeListElement * ptr() { return this; } ~MergeListElement(); }; using MergeListEntry = BackgroundProcessListEntry; /** Maintains a list of currently running merges. * For implementation of system.merges table. */ class MergeList final : public BackgroundProcessList { private: using Parent = BackgroundProcessList; std::atomic merges_with_ttl_counter = 0; public: MergeList() : Parent(CurrentMetrics::Merge) {} void onEntryDestroy(const Parent::Entry & entry) override { if (isTTLMergeType(entry->merge_type)) --merges_with_ttl_counter; } void cancelPartMutations(const StorageID & table_id, const String & partition_id, Int64 mutation_version) { std::lock_guard lock{mutex}; for (auto & merge_element : entries) { if ((partition_id.empty() || merge_element.partition_id == partition_id) && merge_element.table_id == table_id && merge_element.source_data_version < mutation_version && merge_element.result_part_info.getDataVersion() >= mutation_version) merge_element.is_cancelled = true; } } void cancelInPartition(const StorageID & table_id, const String & partition_id, Int64 delimiting_block_number) { std::lock_guard lock{mutex}; for (auto & merge_element : entries) { if (merge_element.table_id == table_id && merge_element.partition_id == partition_id && merge_element.result_part_info.min_block < delimiting_block_number) merge_element.is_cancelled = true; } } /// Merge consists of two parts: assignment and execution. We add merge to /// merge list on execution, but checking merge list during merge /// assignment. This lead to the logical race condition (we can assign more /// merges with TTL than allowed). So we "book" merge with ttl during /// assignment, and remove from list after merge execution. /// /// NOTE: Not important for replicated merge tree, we check count of merges twice: /// in assignment and in queue before execution. void bookMergeWithTTL() { ++merges_with_ttl_counter; } size_t getMergesWithTTLCount() const { return merges_with_ttl_counter; } }; }