ClickHouse/dbms/src/DataStreams/DistinctBlockInputStream.h

56 lines
1.4 KiB
C++

#pragma once
#include <DataStreams/IProfilingBlockInputStream.h>
#include <Interpreters/Limits.h>
#include <Interpreters/SetVariants.h>
namespace DB
{
/** This class is intended for implementation of SELECT DISTINCT clause and
* leaves only unique rows in the stream.
*
* To optimize the SELECT DISTINCT ... LIMIT clause we can
* set limit_hint to non zero value. So we stop emitting new rows after
* count of already emitted rows will reach the limit_hint.
*/
class DistinctBlockInputStream : public IProfilingBlockInputStream
{
public:
/// Empty columns_ means all collumns.
DistinctBlockInputStream(const BlockInputStreamPtr & input, const Limits & limits, size_t limit_hint_, const Names & columns);
String getName() const override { return "Distinct"; }
String getID() const override;
protected:
Block readImpl() override;
private:
bool checkLimits() const;
ConstColumnPlainPtrs getKeyColumns(const Block & block) const;
template <typename Method>
void buildFilter(
Method & method,
const ConstColumnPlainPtrs & key_columns,
IColumn::Filter & filter,
size_t rows,
SetVariants & variants) const;
Names columns_names;
SetVariants data;
Sizes key_sizes;
size_t limit_hint;
/// Restrictions on the maximum size of the output data.
size_t max_rows;
size_t max_bytes;
OverflowMode overflow_mode;
};
}