#pragma once #include #include #include #include #include #include #include #include #include #include namespace DB { class StorageReplicatedMergeTree; /** Removes obsolete data from a table of type ReplicatedMergeTree. */ class ReplicatedMergeTreeCleanupThread { public: explicit ReplicatedMergeTreeCleanupThread(StorageReplicatedMergeTree & storage_); void start() { task->activateAndSchedule(); } void wakeup() { task->schedule(); } void stop() { task->deactivate(); } private: StorageReplicatedMergeTree & storage; String log_name; Poco::Logger * log; BackgroundSchedulePool::TaskHolder task; pcg64 rng{randomSeed()}; void run(); void iterate(); /// Remove old records from ZooKeeper. void clearOldLogs(); /// The replica is marked as "lost" if it is inactive and its log pointer /// is far behind and we are not going to keep logs for it. /// Lost replicas will use different strategy for repair. void markLostReplicas(const std::unordered_map & host_versions_lost_replicas, const std::unordered_map & log_pointers_candidate_lost_replicas, size_t replicas_count, const zkutil::ZooKeeperPtr & zookeeper); using NodeCTimeAndVersionCache = std::map>; /// Remove old block hashes from ZooKeeper. This is done by the leader replica. void clearOldBlocks(const String & blocks_dir_name, UInt64 window_seconds, UInt64 window_size, NodeCTimeAndVersionCache & cached_block_stats); /// Remove old mutations that are done from ZooKeeper. This is done by the leader replica. void clearOldMutations(); NodeCTimeAndVersionCache cached_block_stats_for_sync_inserts; NodeCTimeAndVersionCache cached_block_stats_for_async_inserts; struct NodeWithStat; /// Returns list of blocks (with their stat) sorted by ctime in descending order. void getBlocksSortedByTime(const String & blocks_dir_name, zkutil::ZooKeeper & zookeeper, std::vector & timed_blocks, NodeCTimeAndVersionCache & cached_block_stats); /// TODO Removing old quorum/failed_parts }; }