ClickHouse/dbms/src/Storages/MergeTree/MergeTreeSelectProcessor.h

79 lines
2.4 KiB
C++
Raw Normal View History

2013-04-24 10:31:32 +00:00
#pragma once
#include <DataStreams/IBlockInputStream.h>
2019-10-01 16:50:08 +00:00
#include <Storages/MergeTree/MergeTreeThreadSelectBlockInputProcessor.h>
#include <Storages/MergeTree/MergeTreeData.h>
#include <Storages/MergeTree/MarkRange.h>
#include <Storages/MergeTree/MergeTreeBlockReadUtils.h>
#include <Storages/SelectQueryInfo.h>
2013-04-24 10:31:32 +00:00
namespace DB
{
2018-11-29 09:19:42 +00:00
/// Reads data from a single data part on behalf of a SELECT query.
/// Takes care of PREWHERE, virtual columns, indexes, etc.
/// To read data from multiple parts, the storage (MergeTree) creates multiple such objects.
///
/// Only declarations are visible in this header; the constructor, destructor,
/// finish() and getNewTask() are defined elsewhere.
2019-10-01 16:50:08 +00:00
class MergeTreeSelectProcessor : public MergeTreeBaseSelectProcessor
2013-04-24 10:31:32 +00:00
{
public:
2019-10-01 16:50:08 +00:00
/// Constructs a processor for one data part.
///
/// `column_names_` and `mark_ranges` are taken by value; the remaining non-trivial
/// arguments are taken by const reference. The last three parameters are optional:
/// `virt_column_names` defaults to an empty list, `part_index_in_query` to 0 and
/// `quiet` to false.
///
/// NOTE(review): the meanings below are inferred from the parameter names only,
/// confirm against the definition:
///  - `owned_data_part`: presumably the part to read (see the `data_part` member);
///  - `mark_ranges`: presumably the ranges of marks to read (see `all_mark_ranges`);
///  - `max_block_size_rows`, `preferred_block_size_bytes`,
///    `preferred_max_column_in_block_size_bytes`: presumably limits on the size of produced blocks;
///  - `min_bytes_to_use_direct_io`, `min_bytes_to_use_mmap_io`, `max_read_buffer_size`,
///    `use_uncompressed_cache`, `save_marks_in_cache`: presumably I/O and cache settings for readers.
MergeTreeSelectProcessor(
2018-10-17 03:13:00 +00:00
const MergeTreeData & storage,
const MergeTreeData::DataPartPtr & owned_data_part,
2019-02-10 16:55:12 +00:00
UInt64 max_block_size_rows,
size_t preferred_block_size_bytes,
size_t preferred_max_column_in_block_size_bytes,
2019-08-03 11:02:40 +00:00
Names column_names_,
2019-10-04 15:40:05 +00:00
MarkRanges mark_ranges,
bool use_uncompressed_cache,
const PrewhereInfoPtr & prewhere_info,
bool check_columns,
size_t min_bytes_to_use_direct_io,
size_t min_bytes_to_use_mmap_io,
size_t max_read_buffer_size,
bool save_marks_in_cache,
2017-04-05 20:34:19 +00:00
const Names & virt_column_names = {},
size_t part_index_in_query = 0,
bool quiet = false);
2019-10-01 16:50:08 +00:00
/// Overrides the base class destructor; defined out of line.
~MergeTreeSelectProcessor() override;
/// Name reported for this processor; always the literal "MergeTree".
String getName() const override { return "MergeTree"; }
/// Closes the readers and releases the locks held on the part.
void finish();
2013-11-26 11:55:11 +00:00
protected:
2017-04-05 20:34:19 +00:00
/// Override of the base class hook.
/// NOTE(review): presumably prepares the next read task and returns false when
/// there is nothing left to read - confirm against the definition.
bool getNewTask() override;
2013-04-24 10:31:32 +00:00
private:
/// Used by Task
2018-04-16 12:21:36 +00:00
Names required_columns;
2018-04-19 15:18:26 +00:00
/// Names from the header. Used to order the columns in read blocks.
Names ordered_names;
/// NOTE(review): presumably a set view of the column names for fast lookup - confirm.
NameSet column_name_set;
2019-07-19 14:56:00 +00:00
/// NOTE(review): presumably the columns to read for the task, as computed for this part - confirm.
MergeTreeReadTaskColumns task_columns;
/// The data part will not be removed while this pointer owns it
MergeTreeData::DataPartPtr data_part;
/// Shared lock that forbids changing the column list of the part during reading
std::shared_lock<std::shared_mutex> part_columns_lock;
/// Mark ranges we should read (in ascending order)
MarkRanges all_mark_ranges;
2018-05-23 19:34:37 +00:00
/// Total number of marks we should read
size_t total_marks_count = 0;
/// Value of the _part_index virtual column (used only in SelectExecutor)
2017-04-05 20:34:19 +00:00
size_t part_index_in_query = 0;
2017-04-05 20:34:19 +00:00
/// No in-class initializer here: must be set by the constructor (defined elsewhere).
bool check_columns;
/// NOTE(review): presumably the path of the data part being read - confirm.
String path;
2017-04-05 20:34:19 +00:00
/// Starts as true.
/// NOTE(review): presumably cleared once the first task has been created - confirm.
bool is_first_task = true;
2019-10-01 16:50:08 +00:00
/// Logger obtained under the name "MergeTreeSelectProcessor".
Logger * log = &Logger::get("MergeTreeSelectProcessor");
2013-04-24 10:31:32 +00:00
};
}