#pragma once #include #include #include #include #include #include #include #include #include #include #include namespace DB { /** See the description of the data structure in MergeTreeData. */ class StorageMergeTree : public ext::shared_ptr_helper, public IStorage { public: void startup() override; void shutdown() override; ~StorageMergeTree() override; std::string getName() const override { return data.merging_params.getModeName() + "MergeTree"; } std::string getTableName() const override { return table_name; } bool supportsSampling() const override { return data.supportsSampling(); } bool supportsPrewhere() const override { return data.supportsPrewhere(); } bool supportsFinal() const override { return data.supportsFinal(); } bool supportsIndexForIn() const override { return true; } bool mayBenefitFromIndexForIn(const ASTPtr & left_in_operand) const override { return data.mayBenefitFromIndexForIn(left_in_operand); } const ColumnsDescription & getColumns() const override { return data.getColumns(); } void setColumns(ColumnsDescription columns_) override { return data.setColumns(std::move(columns_)); } NameAndTypePair getColumn(const String & column_name) const override { return data.getColumn(column_name); } bool hasColumn(const String & column_name) const override { return data.hasColumn(column_name); } BlockInputStreams read( const Names & column_names, const SelectQueryInfo & query_info, const Context & context, QueryProcessingStage::Enum & processed_stage, size_t max_block_size, unsigned num_streams) override; BlockOutputStreamPtr write(const ASTPtr & query, const Settings & settings) override; /** Perform the next step in combining the parts. */ bool optimize(const ASTPtr & query, const ASTPtr & partition, bool final, bool deduplicate, const Context & context) override; void dropPartition(const ASTPtr & query, const ASTPtr & partition, bool detach, const Context & context) override; void clearColumnInPartition(const ASTPtr & partition, const Field & column_name, const Context & context) override; void attachPartition(const ASTPtr & partition, bool part, const Context & context) override; void replacePartitionFrom(const StoragePtr & source_table, const ASTPtr & partition, bool replace, const Context & context) override; void freezePartition(const ASTPtr & partition, const String & with_name, const Context & context) override; void mutate(const MutationCommands & commands, const Context & context) override; std::vector getMutationsStatus() const; void drop() override; void truncate(const ASTPtr &) override; void rename(const String & new_path_to_db, const String & new_database_name, const String & new_table_name) override; void alter(const AlterCommands & params, const String & database_name, const String & table_name, const Context & context) override; bool checkTableCanBeDropped() const override; ActionLock getActionLock(StorageActionBlockType action_type) override; MergeTreeData & getData() { return data; } const MergeTreeData & getData() const { return data; } String getDataPath() const override { return full_path; } private: String path; String database_name; String table_name; String full_path; Context & context; BackgroundProcessingPool & background_pool; MergeTreeData data; MergeTreeDataSelectExecutor reader; MergeTreeDataWriter writer; MergeTreeDataMergerMutator merger_mutator; /// For block numbers. SimpleIncrement increment{0}; /// For clearOldParts, clearOldTemporaryDirectories. AtomicStopwatch time_after_previous_cleanup; mutable std::mutex currently_merging_mutex; MergeTreeData::DataParts currently_merging; std::multimap current_mutations_by_version; Logger * log; std::atomic shutdown_called {false}; BackgroundProcessingPool::TaskHandle background_task_handle; void loadMutations(); /** Determines what parts should be merged and merges it. * If aggressive - when selects parts don't takes into account their ratio size and novelty (used for OPTIMIZE query). * Returns true if merge is finished successfully. */ bool merge(size_t aio_threshold, bool aggressive, const String & partition_id, bool final, bool deduplicate, String * out_disable_reason = nullptr); /// Try and find a single part to mutate and mutate it. If some part was successfully mutated, return true. bool tryMutatePart(); bool backgroundTask(); Int64 getCurrentMutationVersion( const MergeTreeData::DataPartPtr & part, std::lock_guard & /* currently_merging_mutex_lock */) const; friend class MergeTreeBlockOutputStream; friend class MergeTreeData; friend struct CurrentlyMergingPartsTagger; protected: /** Attach the table with the appropriate name, along the appropriate path (with / at the end), * (correctness of names and paths are not checked) * consisting of the specified columns. * * primary_expr_ast - expression for sorting; * date_column_name - if not empty, the name of the column with the date used for partitioning by month; otherwise, partition_expr_ast is used as the partitioning expression; */ StorageMergeTree( const String & path_, const String & database_name_, const String & table_name_, const ColumnsDescription & columns_, bool attach, Context & context_, const ASTPtr & primary_expr_ast_, const ASTPtr & secondary_sorting_expr_list_, const String & date_column_name, const ASTPtr & partition_expr_ast_, const ASTPtr & sampling_expression_, /// nullptr, if sampling is not supported. const MergeTreeData::MergingParams & merging_params_, const MergeTreeSettings & settings_, bool has_force_restore_data_flag); }; }