ClickHouse/src/Storages/System/StorageSystemZeros.cpp

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

136 lines
3.3 KiB
C++
Raw Normal View History

2020-03-10 13:01:29 +00:00
#include <Storages/System/StorageSystemZeros.h>
2022-05-20 19:49:31 +00:00
#include <Processors/ISource.h>
2021-10-16 14:03:50 +00:00
#include <QueryPipeline/Pipe.h>
2020-03-10 13:01:29 +00:00
#include <DataTypes/DataTypesNumber.h>
#include <Columns/ColumnsNumber.h>
namespace DB
{
namespace
{
/// State handed to every ZerosSource created by a single read() call when a row limit is set.
struct ZerosState
{
    /// Running count of rows claimed by the sources. Each source advances it
    /// with fetch_add before deciding how many rows it may still emit.
    std::atomic<UInt64> num_generated_rows{0};
};

/// Shared-ownership handle to ZerosState; a null pointer means "no limit tracking".
using ZerosStatePtr = std::shared_ptr<ZerosState>;
/// Source which generates zeros.
/// Uses state to share the number of generated rows between threads.
/// If state is nullptr, then limit is ignored.
2022-05-20 19:49:31 +00:00
class ZerosSource : public ISource
2020-03-10 13:01:29 +00:00
{
public:
ZerosSource(UInt64 block_size, UInt64 limit_, ZerosStatePtr state_)
2022-05-20 19:49:31 +00:00
: ISource(createHeader()), limit(limit_), state(std::move(state_))
2020-03-10 13:01:29 +00:00
{
column = createColumn(block_size);
}
String getName() const override { return "Zeros"; }
protected:
Chunk generate() override
{
auto column_ptr = column;
size_t column_size = column_ptr->size();
if (state)
{
auto generated_rows = state->num_generated_rows.fetch_add(column_size, std::memory_order_acquire);
if (generated_rows >= limit)
return {};
if (generated_rows + column_size > limit)
{
column_size = limit - generated_rows;
column_ptr = createColumn(column_size);
}
}
2022-05-24 19:29:00 +00:00
progress(column->size(), column->byteSize());
2020-03-10 13:01:29 +00:00
return { Columns {std::move(column_ptr)}, column_size };
}
private:
UInt64 limit;
ZerosStatePtr state;
ColumnPtr column;
static Block createHeader()
{
2020-03-10 17:42:31 +00:00
return { ColumnWithTypeAndName(ColumnUInt8::create(), std::make_shared<DataTypeUInt8>(), "zero") };
2020-03-10 13:01:29 +00:00
}
static ColumnPtr createColumn(size_t size)
{
auto column_ptr = ColumnUInt8::create();
/// It is probably the fastest method to create zero column, cause resize_fill uses memset internally.
column_ptr->getData().resize_fill(size);
return column_ptr;
}
};
}
/// Constructs the storage and registers its in-memory metadata:
/// a single column named `zero` of type UInt8.
/// @param table_id_       Identifier forwarded to the IStorage base.
/// @param multithreaded_  Stored as-is; read() uses it to decide whether several streams may be created.
/// @param limit_          Optional total row limit; stored as-is and consulted by read().
StorageSystemZeros::StorageSystemZeros(const StorageID & table_id_, bool multithreaded_, std::optional<UInt64> limit_)
    : IStorage(table_id_)
    , multithreaded(multithreaded_)
    , limit(limit_)
{
    ColumnsDescription columns({{"zero", std::make_shared<DataTypeUInt8>()}});

    StorageInMemoryMetadata metadata;
    metadata.setColumns(std::move(columns));
    setInMemoryMetadata(metadata);
}
2020-08-06 12:24:05 +00:00
/// Builds a pipe of ZerosSource instances for the requested columns.
/// A limit smaller than max_block_size shrinks the block to the limit and forces a single stream;
/// a non-multithreaded storage also uses a single stream. When a limit is set, all sources
/// share one ZerosState and the first source is given the limit as its approximate total row count.
Pipe StorageSystemZeros::read(
    const Names & column_names,
    const StorageSnapshotPtr & storage_snapshot,
    SelectQueryInfo &,
    ContextPtr /*context*/,
    QueryProcessingStage::Enum /*processed_stage*/,
    size_t max_block_size,
    unsigned num_streams)
{
    storage_snapshot->check(column_names);

    /// The whole result fits into one block: no point in running several streams.
    const bool limit_fits_in_one_block = limit.has_value() && *limit < max_block_size;
    if (limit_fits_in_one_block)
        max_block_size = static_cast<size_t>(*limit);

    if (!multithreaded || limit_fits_in_one_block)
        num_streams = 1;

    /// The shared counter is only needed when there is a limit to enforce.
    ZerosStatePtr shared_state;
    if (limit.has_value())
        shared_state = std::make_shared<ZerosState>();

    const UInt64 row_limit = limit.value_or(0);

    Pipe pipe;
    for (size_t stream_index = 0; stream_index < num_streams; ++stream_index)
    {
        auto zeros_source = std::make_shared<ZerosSource>(max_block_size, row_limit, shared_state);

        /// Register the expected total only once, on the first source.
        if (stream_index == 0 && limit.has_value())
            zeros_source->addTotalRowsApprox(*limit);

        pipe.addSource(std::move(zeros_source));
    }

    return pipe;
}
}