2017-09-11 17:55:41 +00:00
|
|
|
#include <Storages/MergeTree/MergeTreePartition.h>
|
|
|
|
#include <Storages/MergeTree/MergeTreeData.h>
|
2019-10-10 16:30:30 +00:00
|
|
|
#include <Storages/MergeTree/IMergeTreeDataPart.h>
|
2017-09-11 17:55:41 +00:00
|
|
|
#include <IO/HashingWriteBuffer.h>
|
2017-11-24 13:55:31 +00:00
|
|
|
#include <Common/FieldVisitors.h>
|
2017-09-11 17:55:41 +00:00
|
|
|
#include <DataTypes/DataTypeDate.h>
|
2018-11-26 12:41:17 +00:00
|
|
|
#include <DataTypes/DataTypeTuple.h>
|
|
|
|
#include <Columns/ColumnTuple.h>
|
2017-09-11 17:55:41 +00:00
|
|
|
#include <Common/SipHash.h>
|
2021-06-14 04:13:35 +00:00
|
|
|
#include <Common/FieldVisitorToString.h>
|
|
|
|
#include <Common/FieldVisitorHash.h>
|
2017-09-11 17:55:41 +00:00
|
|
|
#include <Common/typeid_cast.h>
|
|
|
|
#include <Common/hex.h>
|
2019-01-25 15:17:12 +00:00
|
|
|
#include <Core/Block.h>
|
2017-09-11 17:55:41 +00:00
|
|
|
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
2021-06-09 23:58:51 +00:00
|
|
|
|
2020-02-25 18:10:48 +00:00
|
|
|
namespace ErrorCodes
|
|
|
|
{
|
|
|
|
extern const int LOGICAL_ERROR;
|
2021-11-26 14:49:31 +00:00
|
|
|
extern const int INVALID_PARTITION_VALUE;
|
2020-02-25 18:10:48 +00:00
|
|
|
}
|
2017-09-11 17:55:41 +00:00
|
|
|
|
2021-06-09 23:58:51 +00:00
|
|
|
namespace
|
|
|
|
{
|
|
|
|
/// This is a special visitor which is used to get partition ID.
|
|
|
|
/// Calculate hash for UUID the same way as for UInt128.
|
|
|
|
/// It worked this way until 21.5, and we cannot change it,
|
|
|
|
/// or partition ID will be different in case UUID is used in partition key.
|
|
|
|
/// (It is not recommended to use UUID as partition key).
|
2021-06-14 02:48:10 +00:00
|
|
|
/// NOTE: The code is intentionally copy-pasted,
|
|
|
|
/// so when FieldVisitorHash is changed, LegacyFieldVisitorHash will not change.
|
|
|
|
class LegacyFieldVisitorHash : public StaticVisitor<>
|
2021-06-09 23:58:51 +00:00
|
|
|
{
|
2021-06-14 02:48:10 +00:00
|
|
|
private:
|
|
|
|
SipHash & hash;
|
2021-06-09 23:58:51 +00:00
|
|
|
public:
|
2021-06-14 04:28:17 +00:00
|
|
|
explicit LegacyFieldVisitorHash(SipHash & hash_) : hash(hash_) {}
|
2021-06-14 02:48:10 +00:00
|
|
|
|
|
|
|
void operator() (const Null &) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Null;
|
|
|
|
hash.update(type);
|
|
|
|
}
|
|
|
|
void operator() (const UInt64 & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::UInt64;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x);
|
|
|
|
}
|
|
|
|
void operator() (const UInt128 & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::UInt128;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x);
|
|
|
|
}
|
|
|
|
void operator() (const UInt256 & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::UInt256;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x);
|
|
|
|
}
|
|
|
|
void operator() (const Int64 & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Int64;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x);
|
|
|
|
}
|
|
|
|
void operator() (const Int128 & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Int128;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x);
|
|
|
|
}
|
|
|
|
void operator() (const Int256 & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Int256;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x);
|
|
|
|
}
|
|
|
|
void operator() (const UUID & x) const
|
|
|
|
{
|
|
|
|
operator()(x.toUnderType());
|
|
|
|
}
|
|
|
|
void operator() (const Float64 & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Float64;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x);
|
|
|
|
}
|
|
|
|
void operator() (const String & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::String;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.size());
|
|
|
|
hash.update(x.data(), x.size());
|
|
|
|
}
|
|
|
|
void operator() (const Array & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Array;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.size());
|
|
|
|
|
|
|
|
for (const auto & elem : x)
|
|
|
|
applyVisitor(*this, elem);
|
|
|
|
}
|
|
|
|
void operator() (const Tuple & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Tuple;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.size());
|
|
|
|
|
|
|
|
for (const auto & elem : x)
|
|
|
|
applyVisitor(*this, elem);
|
|
|
|
}
|
|
|
|
void operator() (const Map & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Map;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.size());
|
|
|
|
|
|
|
|
for (const auto & elem : x)
|
|
|
|
applyVisitor(*this, elem);
|
|
|
|
}
|
2021-08-20 21:11:22 +00:00
|
|
|
void operator() (const Object & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Object;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.size());
|
|
|
|
|
|
|
|
for (const auto & [key, value]: x)
|
|
|
|
{
|
|
|
|
hash.update(key);
|
|
|
|
applyVisitor(*this, value);
|
|
|
|
}
|
|
|
|
}
|
2021-06-14 02:48:10 +00:00
|
|
|
void operator() (const DecimalField<Decimal32> & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Decimal32;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.getValue().value);
|
|
|
|
}
|
|
|
|
void operator() (const DecimalField<Decimal64> & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Decimal64;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.getValue().value);
|
|
|
|
}
|
|
|
|
void operator() (const DecimalField<Decimal128> & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Decimal128;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.getValue().value);
|
|
|
|
}
|
|
|
|
void operator() (const DecimalField<Decimal256> & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::Decimal256;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.getValue().value);
|
|
|
|
}
|
|
|
|
void operator() (const AggregateFunctionStateData & x) const
|
|
|
|
{
|
|
|
|
UInt8 type = Field::Types::AggregateFunctionState;
|
|
|
|
hash.update(type);
|
|
|
|
hash.update(x.name.size());
|
|
|
|
hash.update(x.name.data(), x.name.size());
|
|
|
|
hash.update(x.data.size());
|
|
|
|
hash.update(x.data.data(), x.data.size());
|
|
|
|
}
|
2021-06-09 23:58:51 +00:00
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2020-02-27 16:47:40 +00:00
|
|
|
static std::unique_ptr<ReadBufferFromFileBase> openForReading(const DiskPtr & disk, const String & path)
|
2017-09-11 17:55:41 +00:00
|
|
|
{
|
2021-08-16 00:00:32 +00:00
|
|
|
size_t file_size = disk->getFileSize(path);
|
2021-08-24 21:45:58 +00:00
|
|
|
return disk->readFile(path, ReadSettings().adjustBufferSize(file_size), file_size);
|
2017-09-11 17:55:41 +00:00
|
|
|
}
|
|
|
|
|
2019-01-25 15:17:12 +00:00
|
|
|
String MergeTreePartition::getID(const MergeTreeData & storage) const
|
|
|
|
{
|
2020-06-17 10:34:23 +00:00
|
|
|
return getID(storage.getInMemoryMetadataPtr()->getPartitionKey().sample_block);
|
2019-01-25 15:17:12 +00:00
|
|
|
}
|
|
|
|
|
2017-09-13 16:22:04 +00:00
|
|
|
/// NOTE: This ID is used to create part names which are then persisted in ZK and as directory names on the file system.
|
|
|
|
/// So if you want to change this method, be sure to guarantee compatibility with existing table data.
|
2019-01-25 15:17:12 +00:00
|
|
|
String MergeTreePartition::getID(const Block & partition_key_sample) const
|
2017-09-11 17:55:41 +00:00
|
|
|
{
|
2019-01-25 15:17:12 +00:00
|
|
|
if (value.size() != partition_key_sample.columns())
|
2017-09-11 17:55:41 +00:00
|
|
|
throw Exception("Invalid partition key size: " + toString(value.size()), ErrorCodes::LOGICAL_ERROR);
|
|
|
|
|
|
|
|
if (value.empty())
|
2017-09-13 16:22:04 +00:00
|
|
|
return "all"; /// It is tempting to use an empty string here. But that would break directory structure in ZK.
|
2017-09-11 17:55:41 +00:00
|
|
|
|
2017-09-13 16:22:04 +00:00
|
|
|
/// In case all partition fields are represented by integral types, try to produce a human-readable ID.
|
2017-09-11 17:55:41 +00:00
|
|
|
/// Otherwise use a hex-encoded hash.
|
2021-11-26 14:49:31 +00:00
|
|
|
/// NOTE It will work in unexpected way if some partition key column is Nullable:
|
|
|
|
/// are_all_integral will be false if some value is NULL. Maybe we should fix it.
|
2017-09-11 17:55:41 +00:00
|
|
|
bool are_all_integral = true;
|
|
|
|
for (const Field & field : value)
|
|
|
|
{
|
|
|
|
if (field.getType() != Field::Types::UInt64 && field.getType() != Field::Types::Int64)
|
|
|
|
{
|
|
|
|
are_all_integral = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
String result;
|
|
|
|
|
|
|
|
if (are_all_integral)
|
|
|
|
{
|
|
|
|
FieldVisitorToString to_string_visitor;
|
|
|
|
for (size_t i = 0; i < value.size(); ++i)
|
|
|
|
{
|
|
|
|
if (i > 0)
|
|
|
|
result += '-';
|
|
|
|
|
2019-01-25 15:17:12 +00:00
|
|
|
if (typeid_cast<const DataTypeDate *>(partition_key_sample.getByPosition(i).type.get()))
|
2018-05-25 13:29:15 +00:00
|
|
|
result += toString(DateLUT::instance().toNumYYYYMMDD(DayNum(value[i].safeGet<UInt64>())));
|
2017-09-11 17:55:41 +00:00
|
|
|
else
|
|
|
|
result += applyVisitor(to_string_visitor, value[i]);
|
2017-09-13 16:22:04 +00:00
|
|
|
|
|
|
|
/// It is tempting to output DateTime as YYYYMMDDhhmmss, but that would make partition ID
|
|
|
|
/// timezone-dependent.
|
2017-09-11 17:55:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
SipHash hash;
|
2021-06-09 13:51:40 +00:00
|
|
|
LegacyFieldVisitorHash hashing_visitor(hash);
|
2017-09-11 17:55:41 +00:00
|
|
|
for (const Field & field : value)
|
|
|
|
applyVisitor(hashing_visitor, field);
|
|
|
|
|
|
|
|
char hash_data[16];
|
|
|
|
hash.get128(hash_data);
|
|
|
|
result.resize(32);
|
|
|
|
for (size_t i = 0; i < 16; ++i)
|
|
|
|
writeHexByteLowercase(hash_data[i], &result[2 * i]);
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2021-11-26 14:49:31 +00:00
|
|
|
std::optional<Row> MergeTreePartition::tryParseValueFromID(const String & partition_id, const Block & partition_key_sample)
|
|
|
|
{
|
|
|
|
size_t num_keys = partition_key_sample.columns();
|
|
|
|
Row res;
|
|
|
|
res.reserve(num_keys);
|
|
|
|
|
|
|
|
ReadBufferFromString buf(partition_id);
|
|
|
|
if (num_keys == 0)
|
|
|
|
{
|
|
|
|
checkString("all", buf);
|
|
|
|
assertEOF(buf);
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
enum KeyType { DATE, UNSIGNED, SIGNED };
|
|
|
|
|
|
|
|
std::vector<KeyType> key_types;
|
|
|
|
key_types.reserve(num_keys);
|
|
|
|
for (size_t i = 0; i < num_keys; ++i)
|
|
|
|
{
|
|
|
|
auto type = partition_key_sample.getByPosition(i).type;
|
|
|
|
|
|
|
|
/// NOTE Sometimes it's possible to parse Nullable key, but easier to ignore it.
|
|
|
|
if (type->isNullable())
|
|
|
|
return {};
|
|
|
|
|
|
|
|
/// We use Field::Types when serializing partition_id, let's get some Field to check type
|
|
|
|
Field sample_field = type->getDefault();
|
|
|
|
|
|
|
|
if (typeid_cast<const DataTypeDate *>(type.get()))
|
|
|
|
key_types.emplace_back(DATE);
|
|
|
|
else if (sample_field.getType() == Field::Types::UInt64)
|
|
|
|
key_types.emplace_back(UNSIGNED);
|
|
|
|
else if (sample_field.getType() == Field::Types::Int64)
|
|
|
|
key_types.emplace_back(SIGNED);
|
|
|
|
else
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
/// All columns are numeric, will parse partition value
|
|
|
|
for (size_t i = 0; i < num_keys; ++i)
|
|
|
|
{
|
2021-11-30 12:29:05 +00:00
|
|
|
switch (key_types[i])
|
2021-11-26 14:49:31 +00:00
|
|
|
{
|
2021-11-30 12:29:05 +00:00
|
|
|
case DATE:
|
|
|
|
{
|
|
|
|
UInt32 date_yyyymmdd;
|
|
|
|
readText(date_yyyymmdd, buf);
|
|
|
|
constexpr UInt32 min_yyyymmdd = 10000000;
|
|
|
|
constexpr UInt32 max_yyyymmdd = 99999999;
|
|
|
|
if (date_yyyymmdd < min_yyyymmdd || max_yyyymmdd < date_yyyymmdd)
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::INVALID_PARTITION_VALUE, "Cannot parse partition_id: got unexpected Date: {}", date_yyyymmdd);
|
|
|
|
|
|
|
|
UInt32 date = DateLUT::instance().YYYYMMDDToDayNum(date_yyyymmdd);
|
|
|
|
res.emplace_back(date);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case UNSIGNED:
|
|
|
|
{
|
|
|
|
UInt64 value;
|
|
|
|
readText(value, buf);
|
|
|
|
res.emplace_back(value);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case SIGNED:
|
|
|
|
{
|
|
|
|
Int64 value;
|
|
|
|
readText(value, buf);
|
|
|
|
res.emplace_back(value);
|
|
|
|
break;
|
|
|
|
}
|
2021-11-26 14:49:31 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (i + 1 != num_keys)
|
|
|
|
assertChar('-', buf);
|
|
|
|
}
|
|
|
|
|
|
|
|
assertEOF(buf);
|
|
|
|
|
|
|
|
String expected_partition_id = MergeTreePartition{res}.getID(partition_key_sample);
|
|
|
|
if (expected_partition_id != partition_id)
|
|
|
|
throw Exception(ErrorCodes::LOGICAL_ERROR, "Partition ID was parsed incorrectly: expected {}, got {}",
|
|
|
|
expected_partition_id, partition_id);
|
|
|
|
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2018-10-09 18:32:44 +00:00
|
|
|
void MergeTreePartition::serializeText(const MergeTreeData & storage, WriteBuffer & out, const FormatSettings & format_settings) const
|
2017-09-11 17:55:41 +00:00
|
|
|
{
|
2020-06-24 14:12:44 +00:00
|
|
|
auto metadata_snapshot = storage.getInMemoryMetadataPtr();
|
|
|
|
const auto & partition_key_sample = metadata_snapshot->getPartitionKey().sample_block;
|
2020-05-20 12:16:55 +00:00
|
|
|
size_t key_size = partition_key_sample.columns();
|
2017-09-11 17:55:41 +00:00
|
|
|
|
|
|
|
if (key_size == 0)
|
|
|
|
{
|
|
|
|
writeCString("tuple()", out);
|
|
|
|
}
|
2018-10-09 18:32:44 +00:00
|
|
|
else if (key_size == 1)
|
2017-09-11 17:55:41 +00:00
|
|
|
{
|
2020-05-20 12:16:55 +00:00
|
|
|
const DataTypePtr & type = partition_key_sample.getByPosition(0).type;
|
2017-12-15 20:48:46 +00:00
|
|
|
auto column = type->createColumn();
|
2018-10-09 18:32:44 +00:00
|
|
|
column->insert(value[0]);
|
2021-03-09 14:46:52 +00:00
|
|
|
type->getDefaultSerialization()->serializeText(*column, 0, out, format_settings);
|
2017-09-11 17:55:41 +00:00
|
|
|
}
|
2018-10-09 18:32:44 +00:00
|
|
|
else
|
|
|
|
{
|
2018-11-26 12:41:17 +00:00
|
|
|
DataTypes types;
|
|
|
|
Columns columns;
|
2018-10-09 18:32:44 +00:00
|
|
|
for (size_t i = 0; i < key_size; ++i)
|
|
|
|
{
|
2020-05-20 12:16:55 +00:00
|
|
|
const auto & type = partition_key_sample.getByPosition(i).type;
|
2018-11-26 12:41:17 +00:00
|
|
|
types.push_back(type);
|
2018-10-09 18:32:44 +00:00
|
|
|
auto column = type->createColumn();
|
|
|
|
column->insert(value[i]);
|
2018-11-26 12:41:17 +00:00
|
|
|
columns.push_back(std::move(column));
|
2018-10-09 18:32:44 +00:00
|
|
|
}
|
2017-09-11 17:55:41 +00:00
|
|
|
|
2021-03-09 14:46:52 +00:00
|
|
|
auto tuple_serialization = DataTypeTuple(types).getDefaultSerialization();
|
2018-11-26 12:41:17 +00:00
|
|
|
auto tuple_column = ColumnTuple::create(columns);
|
2021-03-09 14:46:52 +00:00
|
|
|
tuple_serialization->serializeText(*tuple_column, 0, out, format_settings);
|
2018-10-09 18:32:44 +00:00
|
|
|
}
|
2017-09-11 17:55:41 +00:00
|
|
|
}
|
|
|
|
|
2020-02-27 16:47:40 +00:00
|
|
|
void MergeTreePartition::load(const MergeTreeData & storage, const DiskPtr & disk, const String & part_path)
|
2017-09-11 17:55:41 +00:00
|
|
|
{
|
2020-06-17 10:34:23 +00:00
|
|
|
auto metadata_snapshot = storage.getInMemoryMetadataPtr();
|
|
|
|
if (!metadata_snapshot->hasPartitionKey())
|
2017-09-11 17:55:41 +00:00
|
|
|
return;
|
|
|
|
|
2021-05-22 16:19:56 +00:00
|
|
|
const auto & partition_key_sample = adjustPartitionKey(metadata_snapshot, storage.getContext()).sample_block;
|
2020-02-27 16:47:40 +00:00
|
|
|
auto partition_file_path = part_path + "partition.dat";
|
|
|
|
auto file = openForReading(disk, partition_file_path);
|
2020-05-20 12:16:55 +00:00
|
|
|
value.resize(partition_key_sample.columns());
|
|
|
|
for (size_t i = 0; i < partition_key_sample.columns(); ++i)
|
2021-05-22 16:19:56 +00:00
|
|
|
partition_key_sample.getByPosition(i).type->getDefaultSerialization()->deserializeBinary(value[i], *file);
|
2017-09-11 17:55:41 +00:00
|
|
|
}
|
|
|
|
|
2020-02-27 16:47:40 +00:00
|
|
|
void MergeTreePartition::store(const MergeTreeData & storage, const DiskPtr & disk, const String & part_path, MergeTreeDataPartChecksums & checksums) const
|
2017-09-11 17:55:41 +00:00
|
|
|
{
|
2020-06-24 16:06:01 +00:00
|
|
|
auto metadata_snapshot = storage.getInMemoryMetadataPtr();
|
2021-05-22 16:19:56 +00:00
|
|
|
const auto & partition_key_sample = adjustPartitionKey(metadata_snapshot, storage.getContext()).sample_block;
|
2020-06-24 16:06:01 +00:00
|
|
|
store(partition_key_sample, disk, part_path, checksums);
|
2019-01-25 15:17:12 +00:00
|
|
|
}
|
|
|
|
|
2020-02-27 16:47:40 +00:00
|
|
|
void MergeTreePartition::store(const Block & partition_key_sample, const DiskPtr & disk, const String & part_path, MergeTreeDataPartChecksums & checksums) const
|
2019-01-25 15:17:12 +00:00
|
|
|
{
|
|
|
|
if (!partition_key_sample)
|
2017-09-11 17:55:41 +00:00
|
|
|
return;
|
|
|
|
|
2020-02-27 16:47:40 +00:00
|
|
|
auto out = disk->writeFile(part_path + "partition.dat");
|
|
|
|
HashingWriteBuffer out_hashing(*out);
|
2017-09-11 17:55:41 +00:00
|
|
|
for (size_t i = 0; i < value.size(); ++i)
|
2021-05-17 14:33:04 +00:00
|
|
|
partition_key_sample.getByPosition(i).type->getDefaultSerialization()->serializeBinary(value[i], out_hashing);
|
2021-05-15 18:32:20 +00:00
|
|
|
|
2017-10-24 14:11:53 +00:00
|
|
|
out_hashing.next();
|
2017-09-11 17:55:41 +00:00
|
|
|
checksums.files["partition.dat"].file_size = out_hashing.count();
|
|
|
|
checksums.files["partition.dat"].file_hash = out_hashing.getHash();
|
2020-10-06 09:38:00 +00:00
|
|
|
out->finalize();
|
2017-09-11 17:55:41 +00:00
|
|
|
}
|
|
|
|
|
2021-05-21 16:14:01 +00:00
|
|
|
void MergeTreePartition::create(const StorageMetadataPtr & metadata_snapshot, Block block, size_t row, ContextPtr context)
|
2020-05-05 15:06:16 +00:00
|
|
|
{
|
2020-06-26 11:30:23 +00:00
|
|
|
if (!metadata_snapshot->hasPartitionKey())
|
2020-06-03 13:27:54 +00:00
|
|
|
return;
|
|
|
|
|
2021-05-24 23:39:56 +00:00
|
|
|
auto partition_key_names_and_types = executePartitionByExpression(metadata_snapshot, block, context);
|
|
|
|
value.resize(partition_key_names_and_types.size());
|
2020-05-05 15:06:16 +00:00
|
|
|
|
2021-05-24 23:39:56 +00:00
|
|
|
/// Executing partition_by expression adds new columns to passed block according to partition functions.
|
|
|
|
/// The block is passed by reference and is used afterwards. `moduloLegacy` needs to be substituted back
|
|
|
|
/// with just `modulo`, because it was a temporary substitution.
|
|
|
|
static constexpr auto modulo_legacy_function_name = "moduloLegacy";
|
|
|
|
|
|
|
|
size_t i = 0;
|
|
|
|
for (const auto & element : partition_key_names_and_types)
|
2020-05-05 15:06:16 +00:00
|
|
|
{
|
2021-05-24 23:39:56 +00:00
|
|
|
auto & partition_column = block.getByName(element.name);
|
2021-05-21 16:14:01 +00:00
|
|
|
|
2021-05-24 23:39:56 +00:00
|
|
|
if (element.name.starts_with(modulo_legacy_function_name))
|
|
|
|
partition_column.name = "modulo" + partition_column.name.substr(std::strlen(modulo_legacy_function_name));
|
2021-05-21 16:14:01 +00:00
|
|
|
|
2021-05-24 23:39:56 +00:00
|
|
|
partition_column.column->get(row, value[i++]);
|
2021-05-16 09:20:59 +00:00
|
|
|
}
|
2021-05-15 18:32:20 +00:00
|
|
|
}
|
2021-05-16 09:20:59 +00:00
|
|
|
|
2021-05-24 23:39:56 +00:00
|
|
|
NamesAndTypesList MergeTreePartition::executePartitionByExpression(const StorageMetadataPtr & metadata_snapshot, Block & block, ContextPtr context)
|
2021-05-21 16:14:01 +00:00
|
|
|
{
|
|
|
|
auto adjusted_partition_key = adjustPartitionKey(metadata_snapshot, context);
|
|
|
|
adjusted_partition_key.expression->execute(block);
|
2021-05-24 23:39:56 +00:00
|
|
|
return adjusted_partition_key.sample_block.getNamesAndTypesList();
|
2021-05-21 16:14:01 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
KeyDescription MergeTreePartition::adjustPartitionKey(const StorageMetadataPtr & metadata_snapshot, ContextPtr context)
|
|
|
|
{
|
|
|
|
const auto & partition_key = metadata_snapshot->getPartitionKey();
|
|
|
|
if (!partition_key.definition_ast)
|
|
|
|
return partition_key;
|
|
|
|
|
|
|
|
ASTPtr ast_copy = partition_key.definition_ast->clone();
|
|
|
|
|
|
|
|
/// Implementation of modulo function was changed from 8bit result type to 16bit. For backward compatibility partition by expression is always
|
|
|
|
/// calculated according to previous version - `moduloLegacy`.
|
|
|
|
if (KeyDescription::moduloToModuloLegacyRecursive(ast_copy))
|
|
|
|
{
|
|
|
|
auto adjusted_partition_key = KeyDescription::getKeyFromAST(ast_copy, metadata_snapshot->columns, context);
|
|
|
|
return adjusted_partition_key;
|
|
|
|
}
|
|
|
|
|
|
|
|
return partition_key;
|
|
|
|
}
|
|
|
|
|
2017-09-11 17:55:41 +00:00
|
|
|
}
|