#pragma once #include #include #include #include #include #include #include #include #include #include #include #include #include #include namespace CurrentMetrics { extern const Metric Merge; } namespace DB { struct MergeInfo { std::string database; std::string table; std::string result_part_name; std::string result_part_path; Array source_part_names; Array source_part_paths; std::string partition_id; bool is_mutation; Float64 elapsed; Float64 progress; UInt64 num_parts; UInt64 total_size_bytes_compressed; UInt64 total_size_marks; UInt64 total_rows_count; UInt64 bytes_read_uncompressed; UInt64 bytes_written_uncompressed; UInt64 rows_read; UInt64 rows_written; UInt64 columns_written; UInt64 memory_usage; UInt64 thread_id; std::string merge_type; std::string merge_algorithm; }; struct FutureMergedMutatedPart; struct MergeListElement : boost::noncopyable { const StorageID table_id; std::string partition_id; const std::string result_part_name; const std::string result_part_path; Int64 result_data_version{}; bool is_mutation{}; UInt64 num_parts{}; Names source_part_names; Names source_part_paths; Int64 source_data_version{}; Stopwatch watch; std::atomic progress{}; std::atomic is_cancelled{}; UInt64 total_size_bytes_compressed{}; UInt64 total_size_marks{}; UInt64 total_rows_count{}; std::atomic bytes_read_uncompressed{}; std::atomic bytes_written_uncompressed{}; /// In case of Vertical algorithm they are actual only for primary key columns std::atomic rows_read{}; std::atomic rows_written{}; /// Updated only for Vertical algorithm std::atomic columns_written{}; MemoryTracker memory_tracker{VariableContext::Process}; MemoryTracker * background_thread_memory_tracker; MemoryTracker * background_thread_memory_tracker_prev_parent = nullptr; UInt64 thread_id; MergeType merge_type; /// Detected after merge already started std::atomic merge_algorithm; MergeListElement(const StorageID & table_id_, const FutureMergedMutatedPart & future_part); MergeInfo getInfo() const; ~MergeListElement(); }; using MergeListEntry = BackgroundProcessListEntry; /** Maintains a list of currently running merges. * For implementation of system.merges table. */ class MergeList final : public BackgroundProcessList { private: using Parent = BackgroundProcessList; std::atomic merges_with_ttl_counter = 0; public: MergeList() : Parent(CurrentMetrics::Merge) {} void onEntryDestroy(const Parent::Entry & entry) override { if (isTTLMergeType(entry->merge_type)) --merges_with_ttl_counter; } void cancelPartMutations(const StorageID & table_id, const String & partition_id, Int64 mutation_version) { std::lock_guard lock{mutex}; for (auto & merge_element : entries) { if ((partition_id.empty() || merge_element.partition_id == partition_id) && merge_element.table_id == table_id && merge_element.source_data_version < mutation_version && merge_element.result_data_version >= mutation_version) merge_element.is_cancelled = true; } } /// Merge consists of two parts: assignment and execution. We add merge to /// merge list on execution, but checking merge list during merge /// assignment. This lead to the logical race condition (we can assign more /// merges with TTL than allowed). So we "book" merge with ttl during /// assignment, and remove from list after merge execution. /// /// NOTE: Not important for replicated merge tree, we check count of merges twice: /// in assignment and in queue before execution. void bookMergeWithTTL() { ++merges_with_ttl_counter; } size_t getMergesWithTTLCount() const { return merges_with_ttl_counter; } }; }