#include #include #include #include #include namespace DB { namespace ErrorCodes { extern const int EXPECTED_ALL_OR_DISTINCT; extern const int LOGICAL_ERROR; } void NormalizeSelectWithUnionQueryMatcher::getSelectsFromUnionListNode(ASTPtr ast_select, ASTs & selects) { if (const auto * inner_union = ast_select->as()) { for (const auto & child : inner_union->list_of_selects->children) getSelectsFromUnionListNode(child, selects); return; } selects.push_back(ast_select); } void NormalizeSelectWithUnionQueryMatcher::visit(ASTPtr & ast, Data & data) { if (auto * select_union = ast->as()) visit(*select_union, data); } void NormalizeSelectWithUnionQueryMatcher::visit(ASTSelectWithUnionQuery & ast, Data & data) { auto & union_modes = ast.list_of_modes; ASTs selects; const auto & select_list = ast.list_of_selects->children; if (select_list.empty()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty list of selects for ASTSelectWithUnionQuery"); /// Since nodes are traversed from bottom to top, we can also collect union modes from children up to parents. SelectUnionModesSet current_set_of_modes; bool distinct_found = false; for (Int64 i = union_modes.size() - 1; i >= 0; --i) { current_set_of_modes.insert(union_modes[i]); if (const auto * union_ast = typeid_cast(select_list[i + 1].get())) { const auto & current_select_modes = union_ast->set_of_modes; current_set_of_modes.insert(current_select_modes.begin(), current_select_modes.end()); } if (distinct_found) continue; /// Rewrite UNION Mode if (union_modes[i] == SelectUnionMode::UNION_DEFAULT) { if (data.union_default_mode == SetOperationMode::ALL) union_modes[i] = SelectUnionMode::UNION_ALL; else if (data.union_default_mode == SetOperationMode::DISTINCT) union_modes[i] = SelectUnionMode::UNION_DISTINCT; else throw Exception(DB::ErrorCodes::EXPECTED_ALL_OR_DISTINCT, "Expected ALL or DISTINCT in SelectWithUnion query, because setting (union_default_mode) is empty"); } if (union_modes[i] == SelectUnionMode::UNION_ALL) { if (auto * inner_union = select_list[i + 1]->as(); inner_union && inner_union->union_mode == SelectUnionMode::UNION_ALL) { /// Inner_union is an UNION ALL list, just lift up for (auto child = inner_union->list_of_selects->children.rbegin(); child != inner_union->list_of_selects->children.rend(); ++child) selects.push_back(*child); } else selects.push_back(select_list[i + 1]); } /// flatten all left nodes and current node to a UNION DISTINCT list else if (union_modes[i] == SelectUnionMode::UNION_DISTINCT) { auto distinct_list = std::make_shared(); distinct_list->list_of_selects = std::make_shared(); distinct_list->children.push_back(distinct_list->list_of_selects); for (int j = 0; j <= i + 1; ++j) { getSelectsFromUnionListNode(select_list[j], distinct_list->list_of_selects->children); } distinct_list->union_mode = SelectUnionMode::UNION_DISTINCT; distinct_list->is_normalized = true; selects.push_back(std::move(distinct_list)); distinct_found = true; } } if (const auto * union_ast = typeid_cast(select_list[0].get())) { const auto & current_select_modes = union_ast->set_of_modes; current_set_of_modes.insert(current_select_modes.begin(), current_select_modes.end()); } /// No UNION DISTINCT or only one child in select_list if (!distinct_found) { if (auto * inner_union = select_list[0]->as(); inner_union && inner_union->union_mode == SelectUnionMode::UNION_ALL) { /// Inner_union is an UNION ALL list, just lift it up for (auto child = inner_union->list_of_selects->children.rbegin(); child != inner_union->list_of_selects->children.rend(); ++child) selects.push_back(*child); } else selects.push_back(select_list[0]); } /// Just one union type child, lift it up if (selects.size() == 1 && selects[0]->as()) { ast = *(selects[0]->as()); ast.set_of_modes = std::move(current_set_of_modes); return; } // reverse children list std::reverse(selects.begin(), selects.end()); ast.is_normalized = true; ast.union_mode = SelectUnionMode::UNION_ALL; ast.set_of_modes = std::move(current_set_of_modes); ast.list_of_selects->children = std::move(selects); } }