2020-02-11 18:27:52 +00:00
|
|
|
#pragma once
|
|
|
|
|
2020-02-17 17:08:31 +00:00
|
|
|
#include <mutex>
|
|
|
|
|
|
|
|
#include <Core/Block.h>
|
2020-02-11 18:27:52 +00:00
|
|
|
#include <Interpreters/IJoin.h>
|
2020-04-07 09:48:47 +00:00
|
|
|
#include <Interpreters/TableJoin.h>
|
2020-10-10 16:31:10 +00:00
|
|
|
#include <DataStreams/IBlockInputStream.h>
|
|
|
|
|
2020-02-11 18:27:52 +00:00
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2020-02-20 19:13:12 +00:00
|
|
|
/// Used when the 'join_algorithm' setting is set to JoinAlgorithm::AUTO.
|
|
|
|
/// Starts JOIN with the join-in-memory algorithm and switches to join-on-disk on the fly if there is not enough memory to hold the right table.
|
|
|
|
/// Currently, join-in-memory and join-on-disk are the JoinAlgorithm::HASH and JoinAlgorithm::PARTIAL_MERGE joins respectively.
|
2020-02-11 18:27:52 +00:00
|
|
|
class JoinSwitcher : public IJoin
|
|
|
|
{
|
|
|
|
public:
|
2020-04-07 09:48:47 +00:00
|
|
|
JoinSwitcher(std::shared_ptr<TableJoin> table_join_, const Block & right_sample_block_);
|
2020-02-11 18:27:52 +00:00
|
|
|
|
2021-03-25 18:11:54 +00:00
|
|
|
const TableJoin & getTableJoin() const override { return *table_join; }
|
|
|
|
|
2020-02-20 19:13:12 +00:00
|
|
|
/// Add block of data from right hand of JOIN into current join object.
|
|
|
|
/// If join-in-memory memory limit exceeded switches to join-on-disk and continue with it.
|
|
|
|
/// @returns false, if join-on-disk disk limit exceeded
|
2020-03-18 03:27:32 +00:00
|
|
|
bool addJoinedBlock(const Block & block, bool check_limits) override;
|
2020-02-11 18:27:52 +00:00
|
|
|
|
|
|
|
void joinBlock(Block & block, std::shared_ptr<ExtraBlock> & not_processed) override
|
|
|
|
{
|
|
|
|
join->joinBlock(block, not_processed);
|
|
|
|
}
|
|
|
|
|
2021-07-14 10:02:23 +00:00
|
|
|
const Block & getTotals() const override
|
2020-02-11 18:27:52 +00:00
|
|
|
{
|
2021-07-14 10:02:23 +00:00
|
|
|
return join->getTotals();
|
2020-02-11 18:27:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void setTotals(const Block & block) override
|
|
|
|
{
|
|
|
|
join->setTotals(block);
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t getTotalRowCount() const override
|
|
|
|
{
|
|
|
|
return join->getTotalRowCount();
|
|
|
|
}
|
|
|
|
|
2020-02-17 17:08:31 +00:00
|
|
|
size_t getTotalByteCount() const override
|
|
|
|
{
|
|
|
|
return join->getTotalByteCount();
|
|
|
|
}
|
|
|
|
|
2020-02-11 18:27:52 +00:00
|
|
|
bool alwaysReturnsEmptySet() const override
|
|
|
|
{
|
|
|
|
return join->alwaysReturnsEmptySet();
|
|
|
|
}
|
|
|
|
|
|
|
|
BlockInputStreamPtr createStreamWithNonJoinedRows(const Block & block, UInt64 max_block_size) const override
|
|
|
|
{
|
|
|
|
return join->createStreamWithNonJoinedRows(block, max_block_size);
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
JoinPtr join;
|
2020-02-18 14:19:13 +00:00
|
|
|
SizeLimits limits;
|
2020-02-20 17:19:16 +00:00
|
|
|
bool switched;
|
2020-02-17 17:08:31 +00:00
|
|
|
mutable std::mutex switch_mutex;
|
2020-04-07 09:48:47 +00:00
|
|
|
std::shared_ptr<TableJoin> table_join;
|
2020-02-18 12:41:23 +00:00
|
|
|
const Block right_sample_block;
|
2020-02-17 17:08:31 +00:00
|
|
|
|
2020-02-20 19:13:12 +00:00
|
|
|
/// Change join-in-memory to join-on-disk moving right hand JOIN data from one to another.
|
|
|
|
/// Throws an error if join-on-disk do not support JOIN kind or strictness.
|
2020-02-17 17:08:31 +00:00
|
|
|
void switchJoin();
|
2020-02-11 18:27:52 +00:00
|
|
|
};
|
|
|
|
|
2020-09-18 16:25:20 +00:00
|
|
|
|
|
|
|
/// Creates NonJoinedBlockInputStream on the first read, which allows the join algorithm to be swapped before that.
|
|
|
|
class LazyNonJoinedBlockInputStream : public IBlockInputStream
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
LazyNonJoinedBlockInputStream(const IJoin & join_, const Block & block, UInt64 max_block_size_)
|
|
|
|
: join(join_)
|
|
|
|
, result_sample_block(block)
|
|
|
|
, max_block_size(max_block_size_)
|
|
|
|
{}
|
|
|
|
|
|
|
|
String getName() const override { return "LazyNonMergeJoined"; }
|
|
|
|
Block getHeader() const override { return result_sample_block; }
|
|
|
|
|
|
|
|
protected:
|
|
|
|
Block readImpl() override
|
|
|
|
{
|
|
|
|
if (!stream)
|
|
|
|
{
|
|
|
|
stream = join.createStreamWithNonJoinedRows(result_sample_block, max_block_size);
|
|
|
|
if (!stream)
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
return stream->read();
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
BlockInputStreamPtr stream;
|
|
|
|
const IJoin & join;
|
|
|
|
Block result_sample_block;
|
|
|
|
UInt64 max_block_size;
|
|
|
|
};
|
|
|
|
|
2020-02-11 18:27:52 +00:00
|
|
|
}
|