mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-12 17:32:32 +00:00
99 lines
3.6 KiB
C++
99 lines
3.6 KiB
C++
#pragma once
|
|
#include <Processors/QueryPlan/IQueryPlanStep.h>
|
|
|
|
namespace DB
|
|
{
|
|
|
|
/// Step which has single input and single output data stream.
|
|
/// It doesn't mean that pipeline has single port before or after such step.
|
|
class ITransformingStep : public IQueryPlanStep
|
|
{
|
|
public:
|
|
/// This flags are used to automatically set properties for output stream.
|
|
/// They are specified in constructor and cannot be changed.
|
|
struct DataStreamTraits
|
|
{
|
|
/// Keep distinct_columns unchanged.
|
|
/// Examples: true for LimitStep, false for ExpressionStep with ARRAY JOIN
|
|
/// It some columns may be removed from result header, call updateDistinctColumns
|
|
bool preserves_distinct_columns;
|
|
|
|
/// True if pipeline has single output port after this step.
|
|
/// Examples: MergeSortingStep, AggregatingStep
|
|
bool returns_single_stream;
|
|
|
|
/// Won't change the number of ports for pipeline.
|
|
/// Examples: true for ExpressionStep, false for MergeSortingStep
|
|
bool preserves_number_of_streams;
|
|
|
|
/// Doesn't change row order.
|
|
/// Examples: true for FilterStep, false for PartialSortingStep
|
|
bool preserves_sorting;
|
|
};
|
|
|
|
/// This flags are used by QueryPlan optimizers.
|
|
/// They can be changed after some optimizations.
|
|
struct TransformTraits
|
|
{
|
|
/// Won't change the total number of rows.
|
|
/// Examples: true for ExpressionStep (without join or array join), false for FilterStep
|
|
bool preserves_number_of_rows;
|
|
};
|
|
|
|
struct Traits
|
|
{
|
|
DataStreamTraits data_stream_traits;
|
|
TransformTraits transform_traits;
|
|
};
|
|
|
|
ITransformingStep(DataStream input_stream, Block output_header, Traits traits, bool collect_processors_ = true);
|
|
|
|
QueryPipelineBuilderPtr updatePipeline(QueryPipelineBuilders pipelines, const BuildQueryPipelineSettings & settings) override;
|
|
|
|
virtual void transformPipeline(QueryPipelineBuilder & pipeline, const BuildQueryPipelineSettings & settings) = 0;
|
|
|
|
const TransformTraits & getTransformTraits() const { return transform_traits; }
|
|
const DataStreamTraits & getDataStreamTraits() const { return data_stream_traits; }
|
|
|
|
/// Updates the input stream of the given step. Used during query plan optimizations.
|
|
/// It won't do any validation of a new stream, so it is your responsibility to ensure that this update doesn't break anything
|
|
/// (e.g. you update data stream traits or correctly remove / add columns).
|
|
void updateInputStream(DataStream input_stream)
|
|
{
|
|
input_streams.clear();
|
|
input_streams.emplace_back(std::move(input_stream));
|
|
|
|
updateOutputStream();
|
|
|
|
updateDistinctColumns(output_stream->header, output_stream->distinct_columns);
|
|
}
|
|
|
|
void describePipeline(FormatSettings & settings) const override;
|
|
|
|
/// Append extra processors for this step.
|
|
void appendExtraProcessors(const Processors & extra_processors);
|
|
|
|
protected:
|
|
/// Clear distinct_columns if res_header doesn't contain all of them.
|
|
static void updateDistinctColumns(const Block & res_header, NameSet & distinct_columns);
|
|
|
|
/// Create output stream from header and traits.
|
|
static DataStream createOutputStream(
|
|
const DataStream & input_stream,
|
|
Block output_header,
|
|
const DataStreamTraits & stream_traits);
|
|
|
|
TransformTraits transform_traits;
|
|
|
|
private:
|
|
virtual void updateOutputStream() = 0;
|
|
|
|
/// We collect processors got after pipeline transformation.
|
|
Processors processors;
|
|
bool collect_processors;
|
|
|
|
const DataStreamTraits data_stream_traits;
|
|
};
|
|
|
|
}
|