ClickHouse/src/Storages/ReadInOrderOptimizer.cpp

129 lines
4.3 KiB
C++
Raw Normal View History

2019-12-10 23:18:24 +00:00
#include <Storages/ReadInOrderOptimizer.h>
#include <Storages/MergeTree/MergeTreeData.h>
2020-03-19 11:34:54 +00:00
#include <Storages/MergeTree/StorageFromMergeTreeDataPart.h>
#include <Interpreters/TableJoin.h>
2019-12-10 23:18:24 +00:00
#include <Functions/IFunction.h>
namespace DB
{
namespace ErrorCodes
{
extern const int LOGICAL_ERROR;
}
/// Remembers the per-element expression actions together with the required sort
/// description and collects the column names that must be skipped by the analysis.
///
/// Throws an Exception with code LOGICAL_ERROR when the number of action sets
/// differs from the number of elements in the sort description.
ReadInOrderOptimizer::ReadInOrderOptimizer(
    const ManyExpressionActions & elements_actions_,
    const SortDescription & required_sort_description_,
    const TreeRewriterResultPtr & syntax_result)
    : elements_actions(elements_actions_)
    , required_sort_description(required_sort_description_)
{
    const bool sizes_match = elements_actions.size() == required_sort_description.size();
    if (!sizes_match)
        throw Exception("Sizes of sort description and actions are mismatched", ErrorCodes::LOGICAL_ERROR);

    /// Exclude every key of array_join_result_to_source from the analysis.
    /// Such columns may carry aliases and reach the description as is, so they
    /// could be mistaken for order key columns at the stage of fetching columns.
    for (const auto & result_and_source : syntax_result->array_join_result_to_source)
        forbidden_columns.insert(result_and_source.first);
}
2020-06-17 11:05:11 +00:00
/// Finds the longest prefix of the required sort description that matches the
/// sorting key of the storage, element by element, with one common read direction.
///
/// An element matches when it names the sorting key column at the same position,
/// or when its actions apply exactly one single-argument function to that column
/// and the function reports itself as monotonic.
///
/// Returns an empty pointer when the storage type is not handled, when the
/// metadata snapshot has no sorting key, or when no prefix element matches.
/// Otherwise returns the matched prefix together with the read direction.
InputOrderInfoPtr ReadInOrderOptimizer::getInputOrder(const StoragePtr & storage, const StorageMetadataPtr & metadata_snapshot) const
{
    /// Only these two storage types are handled; anything else is inapplicable.
    const auto * raw_storage = storage.get();
    const bool applicable_storage = dynamic_cast<const MergeTreeData *>(raw_storage)
        || dynamic_cast<const StorageFromMergeTreeDataPart *>(raw_storage);

    /// Short-circuit keeps the metadata snapshot untouched for inapplicable storages.
    if (!applicable_storage || !metadata_snapshot->hasSortingKey())
        return {};

    const Names sorting_key_columns = metadata_snapshot->getSortingKeyColumns();

    /// Checked access: an empty sort description raises instead of being read out of bounds.
    int read_direction = required_sort_description.at(0).direction;
    const size_t max_prefix_length = std::min(required_sort_description.size(), sorting_key_columns.size());

    SortDescription matched_prefix;
    for (size_t pos = 0; pos < max_prefix_length; ++pos)
    {
        const auto & required_elem = required_sort_description[pos];
        const auto & key_column = sorting_key_columns[pos];

        if (forbidden_columns.count(required_elem.column_name))
            break;

        int direction = required_elem.direction;

        /// Exact match with the order key element in the current read direction.
        if (required_elem.column_name == key_column && direction == read_direction)
        {
            matched_prefix.push_back(required_elem);
            continue;
        }

        /// Otherwise allow only one simple monotonic function of one argument
        /// wrapped around the order key element. A direction of 0 means "rejected".
        bool found_function = false;
        for (const auto & action : elements_actions[pos]->getActions())
        {
            if (action.type != ExpressionAction::APPLY_FUNCTION)
                continue;

            /// A second function application makes the expression too complex.
            if (found_function)
            {
                direction = 0;
                break;
            }
            found_function = true;

            /// The single argument has to be the order key column itself.
            if (action.argument_names.size() != 1 || action.argument_names.at(0) != key_column)
            {
                direction = 0;
                break;
            }

            const auto & func = *action.function_base;
            if (!func.hasInformationAboutMonotonicity())
            {
                direction = 0;
                break;
            }

            auto monotonicity = func.getMonotonicityForRange(*func.getArgumentTypes().at(0), {}, {});
            if (!monotonicity.is_monotonic)
            {
                direction = 0;
                break;
            }

            /// A function that is monotonic but not positive flips the direction.
            if (!monotonicity.is_positive)
                direction = -direction;
        }

        if (!found_function)
            direction = 0;

        /// Every element after the first has to agree with the established direction.
        if (direction == 0 || (pos > 0 && direction != read_direction))
            break;

        /// The first element decides the read direction for the whole prefix.
        if (pos == 0)
            read_direction = direction;

        matched_prefix.push_back(required_elem);
    }

    if (matched_prefix.empty())
        return {};

    return std::make_shared<InputOrderInfo>(std::move(matched_prefix), read_direction);
}
}