2017-06-14 10:50:22 +00:00
|
|
|
#pragma once
|
|
|
|
#include <Core/Block.h>
|
2022-04-27 15:05:45 +00:00
|
|
|
#include <Common/logger_useful.h>
|
2022-10-31 08:00:56 +00:00
|
|
|
#include <Columns/ColumnVector.h>
|
|
|
|
#include <Columns/ColumnsCommon.h>
|
2022-11-16 17:48:08 +00:00
|
|
|
#include <Columns/FilterDescription.h>
|
2018-04-02 12:31:04 +00:00
|
|
|
#include <Storages/MergeTree/MarkRange.h>
|
2017-06-14 10:50:22 +00:00
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2018-03-05 14:41:43 +00:00
|
|
|
template <typename T>
|
|
|
|
class ColumnVector;
|
|
|
|
using ColumnUInt8 = ColumnVector<UInt8>;
|
|
|
|
|
2019-10-10 16:30:30 +00:00
|
|
|
class IMergeTreeReader;
|
2019-05-14 09:58:33 +00:00
|
|
|
class MergeTreeIndexGranularity;
|
2019-11-15 03:38:35 +00:00
|
|
|
struct PrewhereInfo;
|
2021-02-13 22:07:13 +00:00
|
|
|
using PrewhereInfoPtr = std::shared_ptr<PrewhereInfo>;
|
2017-06-14 10:50:22 +00:00
|
|
|
|
2021-06-25 14:49:28 +00:00
|
|
|
class ExpressionActions;
|
|
|
|
using ExpressionActionsPtr = std::shared_ptr<ExpressionActions>;
|
|
|
|
|
2022-06-13 13:00:26 +00:00
|
|
|
struct PrewhereExprStep
|
2022-06-07 07:03:11 +00:00
|
|
|
{
|
|
|
|
ExpressionActionsPtr actions;
|
|
|
|
String column_name;
|
|
|
|
bool remove_column = false;
|
|
|
|
bool need_filter = false;
|
|
|
|
};
|
|
|
|
|
|
|
|
/// The same as PrewhereInfo, but with ExpressionActions instead of ActionsDAG
|
|
|
|
struct PrewhereExprInfo
|
|
|
|
{
|
|
|
|
std::vector<PrewhereExprStep> steps;
|
|
|
|
|
2022-06-07 21:00:34 +00:00
|
|
|
std::string dump() const;
|
2023-02-23 12:31:56 +00:00
|
|
|
|
|
|
|
std::string dumpConditions() const;
|
2022-06-07 07:03:11 +00:00
|
|
|
};
|
|
|
|
|
2022-10-04 11:59:11 +00:00
|
|
|
class FilterWithCachedCount
|
|
|
|
{
|
2022-12-13 14:01:33 +00:00
|
|
|
ConstantFilterDescription const_description; /// TODO: ConstantFilterDescription only checks always true/false for const columns
|
|
|
|
/// think how to handle when the column in not const but has all 0s or all 1s
|
2022-10-04 11:59:11 +00:00
|
|
|
ColumnPtr column = nullptr;
|
|
|
|
const IColumn::Filter * data = nullptr;
|
|
|
|
mutable size_t cached_count_bytes = -1;
|
|
|
|
|
|
|
|
public:
|
|
|
|
explicit FilterWithCachedCount() = default;
|
|
|
|
|
|
|
|
explicit FilterWithCachedCount(const ColumnPtr & column_)
|
2022-12-13 14:01:33 +00:00
|
|
|
: const_description(*column_)
|
2022-10-04 11:59:11 +00:00
|
|
|
{
|
2022-11-16 17:48:08 +00:00
|
|
|
ColumnPtr col = column_->convertToFullIfNeeded();
|
|
|
|
FilterDescription desc(*col);
|
|
|
|
column = desc.data_holder ? desc.data_holder : col;
|
|
|
|
data = desc.data;
|
2022-10-04 11:59:11 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
bool present() const { return !!column; }
|
|
|
|
|
2022-12-13 14:01:33 +00:00
|
|
|
bool alwaysTrue() const { return const_description.always_true; }
|
|
|
|
bool alwaysFalse() const { return const_description.always_false; }
|
|
|
|
|
2022-12-28 14:19:33 +00:00
|
|
|
ColumnPtr getColumn() const { return column; }
|
2022-10-04 11:59:11 +00:00
|
|
|
|
|
|
|
const IColumn::Filter & getData() const { return *data; }
|
|
|
|
|
|
|
|
size_t size() const { return column->size(); }
|
|
|
|
|
|
|
|
size_t countBytesInFilter() const
|
|
|
|
{
|
|
|
|
if (cached_count_bytes == size_t(-1))
|
|
|
|
cached_count_bytes = DB::countBytesInFilter(*data);
|
|
|
|
return cached_count_bytes;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2017-07-11 09:32:39 +00:00
|
|
|
/// MergeTreeReader iterator which allows sequential reading for arbitrary number of rows between pairs of marks in the same part.
|
2017-07-11 17:59:07 +00:00
|
|
|
/// Stores reading state, which can be inside granule. Can skip rows in current granule and start reading from next mark.
|
|
|
|
/// Used generally for reading number of rows less than index granularity to decrease cache misses for fat blocks.
|
2018-02-20 11:45:58 +00:00
|
|
|
class MergeTreeRangeReader
|
2017-06-14 10:50:22 +00:00
|
|
|
{
|
|
|
|
public:
|
2019-11-15 03:38:35 +00:00
|
|
|
MergeTreeRangeReader(
|
2020-01-09 12:54:37 +00:00
|
|
|
IMergeTreeReader * merge_tree_reader_,
|
2019-11-15 03:38:35 +00:00
|
|
|
MergeTreeRangeReader * prev_reader_,
|
2022-06-07 07:03:11 +00:00
|
|
|
const PrewhereExprStep * prewhere_info_,
|
2022-03-15 06:34:25 +00:00
|
|
|
bool last_reader_in_chain_,
|
2022-04-11 13:43:09 +00:00
|
|
|
const Names & non_const_virtual_column_names);
|
2017-06-15 17:01:13 +00:00
|
|
|
|
2018-02-20 11:45:58 +00:00
|
|
|
MergeTreeRangeReader() = default;
|
2017-06-20 10:12:20 +00:00
|
|
|
|
2018-02-20 11:50:33 +00:00
|
|
|
bool isReadingFinished() const;
|
2017-07-11 09:32:39 +00:00
|
|
|
|
2018-02-20 11:50:33 +00:00
|
|
|
size_t numReadRowsInCurrentGranule() const;
|
|
|
|
size_t numPendingRowsInCurrentGranule() const;
|
2019-03-28 15:03:49 +00:00
|
|
|
size_t numRowsInCurrentGranule() const;
|
|
|
|
size_t currentMark() const;
|
2018-02-20 11:45:58 +00:00
|
|
|
|
2018-02-20 11:50:33 +00:00
|
|
|
bool isCurrentRangeFinished() const;
|
2018-02-20 11:45:58 +00:00
|
|
|
bool isInitialized() const { return is_initialized; }
|
2017-06-15 17:01:13 +00:00
|
|
|
|
2022-05-06 13:06:56 +00:00
|
|
|
private:
|
2022-04-11 13:43:09 +00:00
|
|
|
/// Accumulates sequential read() requests to perform a large read instead of multiple small reads
|
2018-02-13 19:34:15 +00:00
|
|
|
class DelayedStream
|
|
|
|
{
|
|
|
|
public:
|
2018-02-20 11:45:58 +00:00
|
|
|
DelayedStream() = default;
|
2021-10-15 08:36:26 +00:00
|
|
|
DelayedStream(size_t from_mark, size_t current_task_last_mark_, IMergeTreeReader * merge_tree_reader);
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2018-11-14 11:26:44 +00:00
|
|
|
/// Read @num_rows rows from @from_mark starting from @offset row
|
2018-02-13 19:34:15 +00:00
|
|
|
/// Returns the number of rows added to block.
|
|
|
|
/// NOTE: have to return number of rows because block has broken invariant:
|
|
|
|
/// some columns may have different size (for example, default columns may be zero size).
|
2019-09-23 19:22:02 +00:00
|
|
|
size_t read(Columns & columns, size_t from_mark, size_t offset, size_t num_rows);
|
2018-11-14 11:26:44 +00:00
|
|
|
|
|
|
|
/// Skip extra rows to current_offset and perform actual reading
|
2019-09-23 19:22:02 +00:00
|
|
|
size_t finalize(Columns & columns);
|
2018-02-13 19:34:15 +00:00
|
|
|
|
|
|
|
bool isFinished() const { return is_finished; }
|
|
|
|
|
|
|
|
private:
|
2018-02-20 11:45:58 +00:00
|
|
|
size_t current_mark = 0;
|
2018-11-14 11:26:44 +00:00
|
|
|
/// Offset from current mark in rows
|
2018-02-20 11:45:58 +00:00
|
|
|
size_t current_offset = 0;
|
2018-11-14 11:26:44 +00:00
|
|
|
/// Num of rows we have to read
|
2018-02-20 11:45:58 +00:00
|
|
|
size_t num_delayed_rows = 0;
|
2021-10-15 08:36:26 +00:00
|
|
|
/// Last mark from all ranges of current task.
|
|
|
|
size_t current_task_last_mark = 0;
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2018-11-14 11:26:44 +00:00
|
|
|
/// Actual reader of data from disk
|
2019-10-10 16:30:30 +00:00
|
|
|
IMergeTreeReader * merge_tree_reader = nullptr;
|
2019-03-30 13:44:23 +00:00
|
|
|
const MergeTreeIndexGranularity * index_granularity = nullptr;
|
2018-02-20 11:45:58 +00:00
|
|
|
bool continue_reading = false;
|
|
|
|
bool is_finished = true;
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2018-11-14 11:26:44 +00:00
|
|
|
/// Current position from the begging of file in rows
|
2018-02-13 19:34:15 +00:00
|
|
|
size_t position() const;
|
2019-09-23 19:22:02 +00:00
|
|
|
size_t readRows(Columns & columns, size_t num_rows);
|
2018-02-13 19:34:15 +00:00
|
|
|
};
|
|
|
|
|
2018-11-14 11:26:44 +00:00
|
|
|
/// Very thin wrapper for DelayedStream
|
|
|
|
/// Check bounds of read ranges and make steps between marks
|
2018-02-13 19:34:15 +00:00
|
|
|
class Stream
|
|
|
|
{
|
|
|
|
public:
|
2018-02-20 11:45:58 +00:00
|
|
|
Stream() = default;
|
2021-10-15 08:36:26 +00:00
|
|
|
Stream(size_t from_mark, size_t to_mark,
|
|
|
|
size_t current_task_last_mark, IMergeTreeReader * merge_tree_reader);
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2018-10-09 14:30:05 +00:00
|
|
|
/// Returns the number of rows added to block.
|
2019-09-23 19:22:02 +00:00
|
|
|
size_t read(Columns & columns, size_t num_rows, bool skip_remaining_rows_in_current_granule);
|
|
|
|
size_t finalize(Columns & columns);
|
2018-02-13 19:34:15 +00:00
|
|
|
void skip(size_t num_rows);
|
|
|
|
|
|
|
|
void finish() { current_mark = last_mark; }
|
|
|
|
bool isFinished() const { return current_mark >= last_mark; }
|
|
|
|
|
|
|
|
size_t numReadRowsInCurrentGranule() const { return offset_after_current_mark; }
|
2019-03-28 08:52:09 +00:00
|
|
|
size_t numPendingRowsInCurrentGranule() const
|
|
|
|
{
|
2019-03-25 16:55:48 +00:00
|
|
|
return current_mark_index_granularity - numReadRowsInCurrentGranule();
|
|
|
|
}
|
2018-11-14 11:26:44 +00:00
|
|
|
size_t numPendingGranules() const { return last_mark - current_mark; }
|
|
|
|
size_t numPendingRows() const;
|
2019-03-28 15:03:49 +00:00
|
|
|
size_t currentMark() const { return current_mark; }
|
2022-03-15 06:34:25 +00:00
|
|
|
UInt64 currentPartOffset() const;
|
|
|
|
UInt64 lastPartOffset() const;
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2018-02-20 11:45:58 +00:00
|
|
|
size_t current_mark = 0;
|
2018-02-13 19:34:15 +00:00
|
|
|
/// Invariant: offset_after_current_mark + skipped_rows_after_offset < index_granularity
|
2018-02-20 11:45:58 +00:00
|
|
|
size_t offset_after_current_mark = 0;
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2021-10-15 08:36:26 +00:00
|
|
|
/// Last mark in current range.
|
2018-02-20 11:45:58 +00:00
|
|
|
size_t last_mark = 0;
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2019-10-10 16:30:30 +00:00
|
|
|
IMergeTreeReader * merge_tree_reader = nullptr;
|
2019-03-30 13:44:23 +00:00
|
|
|
const MergeTreeIndexGranularity * index_granularity = nullptr;
|
2019-03-27 15:57:14 +00:00
|
|
|
|
|
|
|
size_t current_mark_index_granularity = 0;
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2019-03-27 16:23:38 +00:00
|
|
|
DelayedStream stream;
|
|
|
|
|
2018-02-13 19:34:15 +00:00
|
|
|
void checkNotFinished() const;
|
2018-02-20 11:45:58 +00:00
|
|
|
void checkEnoughSpaceInCurrentGranule(size_t num_rows) const;
|
2019-09-23 19:22:02 +00:00
|
|
|
size_t readRows(Columns & columns, size_t num_rows);
|
2018-11-14 11:26:44 +00:00
|
|
|
void toNextMark();
|
2019-12-02 17:10:22 +00:00
|
|
|
size_t ceilRowsToCompleteGranules(size_t rows_num) const;
|
2018-02-13 19:34:15 +00:00
|
|
|
};
|
|
|
|
|
2022-05-06 13:06:56 +00:00
|
|
|
public:
|
2018-02-13 19:34:15 +00:00
|
|
|
/// Statistics after next reading step.
|
|
|
|
class ReadResult
|
|
|
|
{
|
|
|
|
public:
|
2022-05-06 13:06:56 +00:00
|
|
|
Columns columns;
|
|
|
|
size_t num_rows = 0;
|
|
|
|
|
|
|
|
/// The number of rows were added to block as a result of reading chain.
|
|
|
|
size_t numReadRows() const { return num_read_rows; }
|
|
|
|
/// The number of bytes read from disk.
|
|
|
|
size_t numBytesRead() const { return num_bytes_read; }
|
|
|
|
|
|
|
|
private:
|
|
|
|
/// Only MergeTreeRangeReader is supposed to access ReadResult internals.
|
|
|
|
friend class MergeTreeRangeReader;
|
|
|
|
|
2018-02-22 12:43:57 +00:00
|
|
|
using NumRows = std::vector<size_t>;
|
|
|
|
|
2018-02-20 11:45:58 +00:00
|
|
|
struct RangeInfo
|
|
|
|
{
|
|
|
|
size_t num_granules_read_before_start;
|
|
|
|
MarkRange range;
|
|
|
|
};
|
|
|
|
|
2018-02-22 12:43:57 +00:00
|
|
|
using RangesInfo = std::vector<RangeInfo>;
|
|
|
|
|
2022-10-31 08:00:56 +00:00
|
|
|
explicit ReadResult(Poco::Logger * log_) : log(log_) {}
|
2018-02-20 11:45:58 +00:00
|
|
|
|
2022-05-06 13:06:56 +00:00
|
|
|
static size_t getLastMark(const MergeTreeRangeReader::ReadResult::RangesInfo & ranges);
|
|
|
|
|
2019-09-23 19:22:02 +00:00
|
|
|
void addGranule(size_t num_rows_);
|
2018-02-20 13:37:04 +00:00
|
|
|
void adjustLastGranule();
|
2018-03-05 14:41:43 +00:00
|
|
|
void addRows(size_t rows) { num_read_rows += rows; }
|
2018-02-20 11:54:32 +00:00
|
|
|
void addRange(const MarkRange & range) { started_ranges.push_back({rows_per_granule.size(), range}); }
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2022-12-28 14:19:33 +00:00
|
|
|
/// Add current step filter to the result and then for each granule calculate the number of filtered rows at the end.
|
|
|
|
/// Remove them and update filter.
|
|
|
|
/// Apply the filter to the columns and update num_rows if required
|
|
|
|
void optimize(const FilterWithCachedCount & current_filter, bool can_read_incomplete_granules);
|
2018-02-13 19:34:15 +00:00
|
|
|
/// Remove all rows from granules.
|
|
|
|
void clear();
|
|
|
|
|
2019-11-15 03:38:35 +00:00
|
|
|
void setFilterConstTrue();
|
|
|
|
|
2018-02-20 14:26:22 +00:00
|
|
|
void addNumBytesRead(size_t count) { num_bytes_read += count; }
|
|
|
|
|
2022-10-31 08:00:56 +00:00
|
|
|
/// Shrinks columns according to the diff between current and previous rows_per_granule.
|
|
|
|
void shrink(Columns & old_columns, const NumRows & rows_per_granule_previous) const;
|
|
|
|
|
2022-12-28 14:19:33 +00:00
|
|
|
/// Applies the filter to the columns and updates num_rows.
|
|
|
|
void applyFilter(const FilterWithCachedCount & filter);
|
|
|
|
|
2022-10-31 08:00:56 +00:00
|
|
|
/// Verifies that columns and filter sizes match.
|
|
|
|
/// The checks might be non-trivial so it make sense to have the only in debug builds.
|
|
|
|
void checkInternalConsistency() const;
|
2019-11-15 03:38:35 +00:00
|
|
|
|
2022-11-16 17:48:08 +00:00
|
|
|
std::string dumpInfo() const;
|
|
|
|
|
2022-12-28 14:19:33 +00:00
|
|
|
/// Contains columns that are not included into result but might be needed for default values calculation.
|
2022-12-24 23:04:52 +00:00
|
|
|
Block additional_columns;
|
2018-02-20 11:45:58 +00:00
|
|
|
|
2018-02-22 12:43:57 +00:00
|
|
|
RangesInfo started_ranges;
|
2018-02-13 19:34:15 +00:00
|
|
|
/// The number of rows read from each granule.
|
2018-11-14 11:26:44 +00:00
|
|
|
/// Granule here is not number of rows between two marks
|
|
|
|
/// It's amount of rows per single reading act
|
2018-02-22 12:43:57 +00:00
|
|
|
NumRows rows_per_granule;
|
2018-02-13 19:34:15 +00:00
|
|
|
/// Sum(rows_per_granule)
|
2018-03-05 14:41:43 +00:00
|
|
|
size_t total_rows_per_granule = 0;
|
|
|
|
/// The number of rows was read at first step. May be zero if no read columns present in part.
|
2018-02-13 19:34:15 +00:00
|
|
|
size_t num_read_rows = 0;
|
2018-02-22 12:43:57 +00:00
|
|
|
/// The number of rows was removed from last granule after clear or optimize.
|
|
|
|
size_t num_rows_to_skip_in_last_granule = 0;
|
2018-02-20 14:26:22 +00:00
|
|
|
/// Without any filtration.
|
|
|
|
size_t num_bytes_read = 0;
|
2022-12-24 23:04:52 +00:00
|
|
|
|
|
|
|
/// This filter has the size of total_rows_per_granule. This means that it can be applied to newly read columns.
|
|
|
|
/// The result of applying this filter is that only rows that pass all previous filtering steps will remain.
|
2022-11-16 17:48:08 +00:00
|
|
|
FilterWithCachedCount final_filter;
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2022-12-28 14:19:33 +00:00
|
|
|
/// This flag is true when prewhere column can be returned without filtering.
|
|
|
|
/// It's true when it contains 0s from all filtering steps (not just the step when it was calculated).
|
|
|
|
/// NOTE: If we accumulated the final_filter for several steps without applying it then prewhere column calculated at the last step
|
|
|
|
/// will not contain 0s from all previous steps.
|
|
|
|
bool can_return_prewhere_column_without_filtering = true;
|
|
|
|
|
|
|
|
/// Checks if result columns have current final_filter applied.
|
|
|
|
bool filterWasApplied() const { return !final_filter.present() || final_filter.countBytesInFilter() == num_rows; }
|
|
|
|
|
2022-10-31 08:00:56 +00:00
|
|
|
/// Builds updated filter by cutting zeros in granules tails
|
|
|
|
void collapseZeroTails(const IColumn::Filter & filter, const NumRows & rows_per_granule_previous, IColumn::Filter & new_filter) const;
|
2019-12-05 12:27:31 +00:00
|
|
|
size_t countZeroTails(const IColumn::Filter & filter, NumRows & zero_tails, bool can_read_incomplete_granules) const;
|
2018-02-13 19:34:15 +00:00
|
|
|
static size_t numZerosInTail(const UInt8 * begin, const UInt8 * end);
|
2019-11-15 03:38:35 +00:00
|
|
|
|
2022-10-31 08:00:56 +00:00
|
|
|
Poco::Logger * log;
|
2018-02-13 19:34:15 +00:00
|
|
|
};
|
|
|
|
|
2018-02-20 11:45:58 +00:00
|
|
|
ReadResult read(size_t max_rows, MarkRanges & ranges);
|
2017-06-14 10:50:22 +00:00
|
|
|
|
2022-12-23 14:21:57 +00:00
|
|
|
const Block & getSampleBlock() const { return result_sample_block; }
|
2019-09-26 17:29:41 +00:00
|
|
|
|
2017-06-14 10:50:22 +00:00
|
|
|
private:
|
2018-02-20 11:45:58 +00:00
|
|
|
ReadResult startReadingChain(size_t max_rows, MarkRanges & ranges);
|
2022-06-13 13:00:26 +00:00
|
|
|
Columns continueReadingChain(const ReadResult & result, size_t & num_rows);
|
2022-11-16 17:48:08 +00:00
|
|
|
void executePrewhereActionsAndFilterColumns(ReadResult & result) const;
|
2022-12-23 14:21:57 +00:00
|
|
|
void fillPartOffsetColumn(ReadResult & result, UInt64 leading_begin_part_offset, UInt64 leading_end_part_offset);
|
2018-02-13 19:34:15 +00:00
|
|
|
|
2019-10-10 16:30:30 +00:00
|
|
|
IMergeTreeReader * merge_tree_reader = nullptr;
|
2019-03-30 13:44:23 +00:00
|
|
|
const MergeTreeIndexGranularity * index_granularity = nullptr;
|
2018-02-20 11:45:58 +00:00
|
|
|
MergeTreeRangeReader * prev_reader = nullptr; /// If not nullptr, read from prev_reader firstly.
|
2022-06-07 07:03:11 +00:00
|
|
|
const PrewhereExprStep * prewhere_info;
|
2018-02-20 11:45:58 +00:00
|
|
|
|
|
|
|
Stream stream;
|
2017-06-14 10:50:22 +00:00
|
|
|
|
2022-12-23 14:21:57 +00:00
|
|
|
Block read_sample_block; /// Block with columns that are actually read from disk + non-const virtual columns that are filled at this step.
|
|
|
|
Block result_sample_block; /// Block with columns that are returned by this step.
|
2019-09-26 17:29:41 +00:00
|
|
|
|
2018-03-05 14:41:43 +00:00
|
|
|
bool last_reader_in_chain = false;
|
2018-02-20 11:45:58 +00:00
|
|
|
bool is_initialized = false;
|
2022-04-11 13:43:09 +00:00
|
|
|
Names non_const_virtual_column_names;
|
2022-10-31 08:00:56 +00:00
|
|
|
|
|
|
|
Poco::Logger * log = &Poco::Logger::get("MergeTreeRangeReader");
|
2017-06-14 10:50:22 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
}
|