2019-04-15 09:30:45 +00:00
|
|
|
#include <Storages/MergeTree/TTLMergeSelector.h>
|
2020-07-28 14:38:34 +00:00
|
|
|
#include <Storages/MergeTree/MergeTreeData.h>
|
2020-09-02 12:16:12 +00:00
|
|
|
#include <Parsers/queryToString.h>
|
2019-04-15 09:30:45 +00:00
|
|
|
|
|
|
|
#include <algorithm>
|
2020-07-28 14:38:34 +00:00
|
|
|
#include <cmath>
|
2019-04-15 09:30:45 +00:00
|
|
|
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2020-09-02 10:30:04 +00:00
|
|
|
const String & getPartitionIdForPart(const ITTLMergeSelector::Part & part_info)
|
2020-07-28 14:38:34 +00:00
|
|
|
{
|
|
|
|
const MergeTreeData::DataPartPtr & part = *static_cast<const MergeTreeData::DataPartPtr *>(part_info.data);
|
|
|
|
return part->info.partition_id;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-09-04 10:52:51 +00:00
|
|
|
IMergeSelector::PartsRange ITTLMergeSelector::select(
|
2020-09-03 13:29:18 +00:00
|
|
|
const PartsRanges & parts_ranges,
|
2019-04-15 09:30:45 +00:00
|
|
|
const size_t max_total_size_to_merge)
|
|
|
|
{
|
2020-09-03 13:29:18 +00:00
|
|
|
using Iterator = IMergeSelector::PartsRange::const_iterator;
|
2019-04-15 09:30:45 +00:00
|
|
|
Iterator best_begin;
|
|
|
|
ssize_t partition_to_merge_index = -1;
|
|
|
|
time_t partition_to_merge_min_ttl = 0;
|
|
|
|
|
2020-09-03 13:29:18 +00:00
|
|
|
for (size_t i = 0; i < parts_ranges.size(); ++i)
|
2019-04-15 09:30:45 +00:00
|
|
|
{
|
2020-09-03 13:29:18 +00:00
|
|
|
const auto & mergeable_parts_in_partition = parts_ranges[i];
|
2020-07-28 14:38:34 +00:00
|
|
|
if (mergeable_parts_in_partition.empty())
|
|
|
|
continue;
|
|
|
|
|
|
|
|
const auto & partition_id = getPartitionIdForPart(mergeable_parts_in_partition.front());
|
|
|
|
const auto & next_merge_time_for_partition = merge_due_times[partition_id];
|
|
|
|
if (next_merge_time_for_partition > current_time)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
for (Iterator part_it = mergeable_parts_in_partition.cbegin(); part_it != mergeable_parts_in_partition.cend(); ++part_it)
|
2019-04-15 09:30:45 +00:00
|
|
|
{
|
2020-09-02 10:30:04 +00:00
|
|
|
time_t ttl = getTTLForPart(*part_it);
|
2019-07-28 10:30:46 +00:00
|
|
|
|
2020-09-02 12:16:12 +00:00
|
|
|
if (ttl && !isTTLAlreadySatisfied(*part_it) && (partition_to_merge_index == -1 || ttl < partition_to_merge_min_ttl))
|
2019-04-15 09:30:45 +00:00
|
|
|
{
|
2020-08-21 15:44:29 +00:00
|
|
|
partition_to_merge_min_ttl = ttl;
|
|
|
|
partition_to_merge_index = i;
|
|
|
|
best_begin = part_it;
|
2019-04-15 09:30:45 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (partition_to_merge_index == -1 || partition_to_merge_min_ttl > current_time)
|
|
|
|
return {};
|
|
|
|
|
2020-09-03 13:29:18 +00:00
|
|
|
const auto & best_partition = parts_ranges[partition_to_merge_index];
|
2019-04-15 09:30:45 +00:00
|
|
|
Iterator best_end = best_begin + 1;
|
|
|
|
size_t total_size = 0;
|
|
|
|
|
|
|
|
while (true)
|
|
|
|
{
|
2020-09-02 10:30:04 +00:00
|
|
|
time_t ttl = getTTLForPart(*best_begin);
|
2019-07-28 10:30:46 +00:00
|
|
|
|
2020-09-02 12:16:12 +00:00
|
|
|
if (!ttl || isTTLAlreadySatisfied(*best_begin) || ttl > current_time
|
2020-08-21 15:44:29 +00:00
|
|
|
|| (max_total_size_to_merge && total_size > max_total_size_to_merge))
|
2019-04-15 09:30:45 +00:00
|
|
|
{
|
|
|
|
++best_begin;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
total_size += best_begin->size;
|
|
|
|
if (best_begin == best_partition.begin())
|
|
|
|
break;
|
|
|
|
|
|
|
|
--best_begin;
|
|
|
|
}
|
|
|
|
|
|
|
|
while (best_end != best_partition.end())
|
|
|
|
{
|
2020-09-02 10:30:04 +00:00
|
|
|
time_t ttl = getTTLForPart(*best_end);
|
2019-07-28 10:30:46 +00:00
|
|
|
|
2020-09-02 12:16:12 +00:00
|
|
|
if (!ttl || isTTLAlreadySatisfied(*best_end) || ttl > current_time
|
2020-08-21 15:44:29 +00:00
|
|
|
|| (max_total_size_to_merge && total_size > max_total_size_to_merge))
|
2019-04-15 09:30:45 +00:00
|
|
|
break;
|
|
|
|
|
|
|
|
total_size += best_end->size;
|
|
|
|
++best_end;
|
|
|
|
}
|
|
|
|
|
2020-07-28 14:38:34 +00:00
|
|
|
const auto & best_partition_id = getPartitionIdForPart(best_partition.front());
|
|
|
|
merge_due_times[best_partition_id] = current_time + merge_cooldown_time;
|
|
|
|
|
2020-09-03 13:29:18 +00:00
|
|
|
return PartsRange(best_begin, best_end);
|
2019-04-15 09:30:45 +00:00
|
|
|
}
|
|
|
|
|
2020-09-02 10:30:04 +00:00
|
|
|
time_t TTLDeleteMergeSelector::getTTLForPart(const IMergeSelector::Part & part) const
|
|
|
|
{
|
2020-09-02 12:16:12 +00:00
|
|
|
return only_drop_parts ? part.ttl_infos.part_max_ttl : part.ttl_infos.part_min_ttl;
|
2020-09-02 10:30:04 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
time_t TTLRecompressMergeSelector::getTTLForPart(const IMergeSelector::Part & part) const
|
|
|
|
{
|
2020-09-09 09:15:42 +00:00
|
|
|
return part.ttl_infos.getMinimalMaxRecompressionTTL();
|
2020-09-02 12:16:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
bool TTLRecompressMergeSelector::isTTLAlreadySatisfied(const IMergeSelector::Part & part) const
|
|
|
|
{
|
|
|
|
if (recompression_ttls.empty())
|
|
|
|
return false;
|
|
|
|
|
2020-09-09 09:15:42 +00:00
|
|
|
auto ttl_description = selectTTLDescriptionForTTLInfos(recompression_ttls, part.ttl_infos.recompression_ttl, current_time, true);
|
2020-09-02 12:16:12 +00:00
|
|
|
|
|
|
|
if (!ttl_description)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
auto ast_to_str = [](ASTPtr query) -> String
|
|
|
|
{
|
|
|
|
if (!query)
|
|
|
|
return "";
|
|
|
|
return queryToString(query);
|
|
|
|
};
|
|
|
|
|
|
|
|
return ast_to_str(ttl_description->recompression_codec) == ast_to_str(part.compression_codec_desc);
|
2020-09-02 10:30:04 +00:00
|
|
|
}
|
|
|
|
|
2019-04-15 09:30:45 +00:00
|
|
|
}
|