/// ClickHouse — dbms/src/Storages/MergeTree/MergeTreeReader.h

#pragma once

#include <Storages/MarkCache.h>
#include <Storages/MergeTree/MarkRange.h>
#include <Storages/MergeTree/MergeTreeData.h>
#include <Storages/MergeTree/MergeTreeRangeReader.h>
#include <IO/CompressedReadBufferFromFile.h>
#include <Core/NamesAndTypes.h>
#include <port/clock.h>


class CachedCompressedReadBuffer;

namespace DB
{

class IDataType;

/// Reads the data between pairs of marks in the same part. When reading consecutive ranges, avoids unnecessary seeks.
/// When ranges are almost consecutive, seeks are fast because they are performed inside the buffer.
/// Avoids loading the marks file if it is not needed (e.g. when reading the whole part).
class MergeTreeReader : private boost::noncopyable
2013-11-26 11:55:11 +00:00
{
public:
using ValueSizeMap = std::map<std::string, double>;
using DeserializeBinaryBulkStateMap = std::map<std::string, IDataType::DeserializeBinaryBulkStatePtr>;
MergeTreeReader(const String & path, /// Path to the directory containing the part
const MergeTreeData::DataPartPtr & data_part, const NamesAndTypesList & columns,
UncompressedCache * uncompressed_cache,
MarkCache * mark_cache,
bool save_marks_in_cache,
2018-10-17 03:13:00 +00:00
const MergeTreeData & storage, const MarkRanges & all_mark_ranges,
size_t aio_threshold, size_t max_read_buffer_size,
const ValueSizeMap & avg_value_size_hints = ValueSizeMap{},
const ReadBufferFromFileBase::ProfileCallback & profile_callback = ReadBufferFromFileBase::ProfileCallback{},
clockid_t clock_type = CLOCK_MONOTONIC_COARSE);
2014-07-23 15:24:45 +00:00
~MergeTreeReader();
2013-11-26 11:55:11 +00:00
const ValueSizeMap & getAvgValueSizeHints() const;
2015-09-16 17:49:08 +00:00
/// Add columns from ordered_names that are not present in the block.
/// Missing columns are added in the order specified by ordered_names.
/// If at least one column was added, reorders all columns in the block according to ordered_names.
/// num_rows is needed in case block is empty.
void fillMissingColumns(Block & res, bool & should_reorder, bool & should_evaluate_missing_defaults, size_t num_rows);
/// Sort columns to ensure consistent order among all blocks.
2018-04-23 19:05:46 +00:00
/// If filter_name is not nullptr and block has filter column, move it to the end of block.
2018-04-16 12:21:36 +00:00
void reorderColumns(Block & res, const Names & ordered_names, const String * filter_name);
/// Evaluate defaulted columns if necessary.
void evaluateMissingDefaults(Block & res);
2014-12-04 15:50:48 +00:00
2018-02-13 19:34:15 +00:00
const NamesAndTypesList & getColumns() const { return columns; }
2018-11-28 15:05:28 +00:00
/// Return the number of rows has been read or zero if there is no columns to read.
/// If continue_reading is true, continue reading from last state, otherwise seek to from_mark
size_t readRows(size_t from_mark, bool continue_reading, size_t max_rows_to_read, Block & res);
2016-07-19 10:57:57 +00:00
private:
class Stream
{
public:
Stream(
const String & path_prefix_, const String & extension_, size_t marks_count_,
const MarkRanges & all_mark_ranges,
MarkCache * mark_cache, bool save_marks_in_cache,
UncompressedCache * uncompressed_cache,
size_t aio_threshold, size_t max_read_buffer_size,
const ReadBufferFromFileBase::ProfileCallback & profile_callback, clockid_t clock_type);
2013-11-26 11:55:11 +00:00
void seekToMark(size_t index);
void seekToStart();
2013-11-26 11:55:11 +00:00
ReadBuffer * data_buffer;
2016-05-04 18:04:36 +00:00
private:
Stream() = default;
/// NOTE: lazily loads marks from the marks cache.
const MarkInCompressedFile & getMark(size_t index);
void loadMarks();
std::string path_prefix;
std::string extension;
size_t marks_count;
MarkCache * mark_cache;
bool save_marks_in_cache;
MarkCache::MappedPtr marks;
2018-12-20 17:37:02 +00:00
std::unique_ptr<CachedCompressedReadBuffer> cached_buffer;
std::unique_ptr<CompressedReadBufferFromFile> non_cached_buffer;
};
2013-11-26 11:55:11 +00:00
using FileStreams = std::map<std::string, std::unique_ptr<Stream>>;
2013-11-26 11:55:11 +00:00
/// avg_value_size_hints are used to reduce the number of reallocations when creating columns of variable size.
ValueSizeMap avg_value_size_hints;
/// Stores states for IDataType::deserializeBinaryBulk
DeserializeBinaryBulkStateMap deserialize_binary_bulk_state_map;
/// Path to the directory containing the part
String path;
MergeTreeData::DataPartPtr data_part;
FileStreams streams;
/// Columns that are read.
NamesAndTypesList columns;
UncompressedCache * uncompressed_cache;
MarkCache * mark_cache;
/// If save_marks_in_cache is false, then, if marks are not in cache, we will load them but won't save in the cache, to avoid evicting other data.
bool save_marks_in_cache;
2015-04-16 06:12:35 +00:00
2018-10-17 03:13:00 +00:00
const MergeTreeData & storage;
MarkRanges all_mark_ranges;
size_t aio_threshold;
size_t max_read_buffer_size;
size_t index_granularity;
2013-11-26 11:55:11 +00:00
2018-12-20 17:37:02 +00:00
void addStreams(const String & name, const IDataType & type,
2018-10-11 02:57:48 +00:00
const MarkRanges & all_mark_ranges, const ReadBufferFromFileBase::ProfileCallback & profile_callback, clockid_t clock_type);
void readData(
const String & name, const IDataType & type, IColumn & column,
size_t from_mark, bool continue_reading, size_t max_rows_to_read,
bool read_offsets = true);
2015-04-02 03:08:43 +00:00
2017-06-14 10:50:22 +00:00
friend class MergeTreeRangeReader::DelayedStream;
2013-11-26 11:55:11 +00:00
};
}