mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-10-05 08:00:51 +00:00
105 lines
3.5 KiB
C++
105 lines
3.5 KiB
C++
|
#include <Storages/ReadInOrderOptimizer.h>
|
||
|
#include <Storages/MergeTree/MergeTreeData.h>
|
||
|
#include <Functions/IFunction.h>
|
||
|
|
||
|
namespace DB
|
||
|
{
|
||
|
|
||
|
/// Error codes referenced in this file. Only declared here (extern);
/// LOGICAL_ERROR is the code passed to the exception thrown by the ReadInOrderOptimizer constructor.
namespace ErrorCodes
|
||
|
{
|
||
|
extern const int LOGICAL_ERROR;
|
||
|
}
|
||
|
|
||
|
|
||
|
/// Stores the per-element expression actions together with the required sort description
/// and collects the names of columns that must not be analyzed.
/// Throws LOGICAL_ERROR if the number of actions differs from the number of sort description elements.
ReadInOrderOptimizer::ReadInOrderOptimizer(
    const ManyExpressionActions & elements_actions_,
    const SortDescription & required_sort_description_,
    const SyntaxAnalyzerResultPtr & syntax_result)
    : elements_actions(elements_actions_)
    , required_sort_description(required_sort_description_)
{
    /// Each element of the sort description must have its own set of actions.
    const bool sizes_match = elements_actions.size() == required_sort_description.size();
    if (!sizes_match)
        throw Exception("Sizes of sort decription and actions are mismatched", ErrorCodes::LOGICAL_ERROR);

    /// Result columns of ARRAY JOIN are excluded from the analysis.
    /// TODO: forbid more columns for analyzing.
    const auto & array_join_columns = syntax_result->array_join_result_to_source;
    for (const auto & result_and_source : array_join_columns)
    {
        forbidden_columns.insert(result_and_source.first);
    }
}
|
||
|
|
||
|
/// Finds the longest prefix of the required sort description that can be produced
/// by reading `merge_tree` in the order of its sorting key.
///
/// An element of the required sort description is accepted if it either
///  - names exactly the sorting key column at the same position and has the current read direction, or
///  - is computed from that single sorting key column by at most one function
///    that reports itself as monotonic (a non-positive monotonic function flips the direction).
///
/// The first element determines the read direction; every following element must agree with it.
///
/// Returns an empty pointer when the table has no sorting key, when nothing is required
/// to be sorted, or when no prefix could be matched. Otherwise returns the matched prefix
/// together with the read direction.
InputSortingInfoPtr ReadInOrderOptimizer::analyze(const MergeTreeData & merge_tree)
{
    if (!merge_tree.hasSortingKey())
        return {};

    /// Nothing is required to be sorted, so there is nothing to optimize.
    /// This also protects the access to the first element below, which used to throw std::out_of_range.
    if (required_sort_description.empty())
        return {};

    SortDescription order_key_prefix_descr;
    int read_direction = required_sort_description[0].direction;

    const auto & sorting_key_columns = merge_tree.getSortingKeyColumns();
    size_t prefix_size = std::min(required_sort_description.size(), sorting_key_columns.size());

    for (size_t i = 0; i < prefix_size; ++i)
    {
        const auto & required_column = required_sort_description[i];

        if (forbidden_columns.count(required_column.column_name))
            break;

        /// Optimize in case of exact match with order key element
        ///  or in some simple cases when order key element is wrapped into monotonic function.
        int current_direction = required_column.direction;
        if (required_column.column_name == sorting_key_columns[i] && current_direction == read_direction)
        {
            order_key_prefix_descr.push_back(required_column);
            continue;
        }

        /// The expression must depend on exactly one column, and it must be the sorting key column at this position.
        const auto & input_columns = elements_actions[i]->getRequiredColumnsWithTypes();
        if (input_columns.size() != 1 || input_columns.front().name != sorting_key_columns[i])
            break;

        /// A direction of zero marks the expression as unusable for reading in order.
        bool seen_function = false;
        for (const auto & action : elements_actions[i]->getActions())
        {
            if (action.type != ExpressionAction::APPLY_FUNCTION)
                continue;

            /// Only a single function application over the key column is supported.
            if (seen_function)
            {
                current_direction = 0;
                break;
            }
            seen_function = true;

            const auto & func = *action.function_base;
            if (!func.hasInformationAboutMonotonicity())
            {
                current_direction = 0;
                break;
            }

            /// Empty bounds are passed for both ends of the range.
            auto monotonicity = func.getMonotonicityForRange(*input_columns.front().type, {}, {});
            if (!monotonicity.is_monotonic)
            {
                current_direction = 0;
                break;
            }

            /// A non-positive monotonic function reverses the order of the underlying column.
            if (!monotonicity.is_positive)
                current_direction *= -1;
        }

        /// Every element after the first must agree with the direction chosen by the first one.
        if (!current_direction || (i > 0 && current_direction != read_direction))
            break;

        if (i == 0)
            read_direction = current_direction;

        order_key_prefix_descr.push_back(required_column);
    }

    if (order_key_prefix_descr.empty())
        return {};

    return std::make_shared<InputSortingInfo>(std::move(order_key_prefix_descr), read_direction);
}
|
||
|
|
||
|
}
|