2022-08-23 09:50:02 +00:00
|
|
|
#include <Analyzer/UnionNode.h>
|
|
|
|
|
|
|
|
#include <Common/SipHash.h>
|
2022-08-31 15:21:17 +00:00
|
|
|
#include <Common/FieldVisitorToString.h>
|
2022-08-23 09:50:02 +00:00
|
|
|
|
|
|
|
#include <Core/NamesAndTypes.h>
|
|
|
|
|
|
|
|
#include <IO/WriteBuffer.h>
|
|
|
|
#include <IO/WriteHelpers.h>
|
|
|
|
#include <IO/Operators.h>
|
|
|
|
|
|
|
|
#include <Parsers/ASTExpressionList.h>
|
|
|
|
#include <Parsers/ASTTablesInSelectQuery.h>
|
|
|
|
#include <Parsers/ASTSubquery.h>
|
|
|
|
#include <Parsers/ASTSelectQuery.h>
|
|
|
|
#include <Parsers/ASTSelectWithUnionQuery.h>
|
|
|
|
#include <Parsers/ASTIdentifier.h>
|
|
|
|
#include <Parsers/ASTFunction.h>
|
|
|
|
|
|
|
|
#include <Core/ColumnWithTypeAndName.h>
|
|
|
|
|
|
|
|
#include <DataTypes/getLeastSupertype.h>
|
|
|
|
|
|
|
|
#include <Analyzer/QueryNode.h>
|
|
|
|
#include <Analyzer/Utils.h>
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
|
|
|
namespace ErrorCodes
|
|
|
|
{
|
|
|
|
extern const int TYPE_MISMATCH;
|
|
|
|
}
|
|
|
|
|
|
|
|
UnionNode::UnionNode()
|
2022-10-07 10:44:28 +00:00
|
|
|
: IQueryTreeNode(children_size)
|
2022-08-23 09:50:02 +00:00
|
|
|
{
|
|
|
|
children[queries_child_index] = std::make_shared<ListNode>();
|
|
|
|
}
|
|
|
|
|
2022-08-31 15:21:17 +00:00
|
|
|
NamesAndTypes UnionNode::computeProjectionColumns() const
|
2022-08-23 09:50:02 +00:00
|
|
|
{
|
|
|
|
std::vector<NamesAndTypes> projections;
|
|
|
|
|
|
|
|
NamesAndTypes query_node_projection;
|
|
|
|
|
2022-10-17 17:46:30 +00:00
|
|
|
const auto & query_nodes = getQueries().getNodes();
|
|
|
|
projections.reserve(query_nodes.size());
|
|
|
|
|
2022-08-23 09:50:02 +00:00
|
|
|
for (const auto & query_node : query_nodes)
|
|
|
|
{
|
|
|
|
if (auto * query_node_typed = query_node->as<QueryNode>())
|
|
|
|
{
|
2022-08-31 15:21:17 +00:00
|
|
|
auto projection_columns = query_node_typed->getProjectionColumns();
|
2022-08-23 09:50:02 +00:00
|
|
|
query_node_projection = NamesAndTypes(projection_columns.begin(), projection_columns.end());
|
|
|
|
}
|
|
|
|
else if (auto * union_node_typed = query_node->as<UnionNode>())
|
|
|
|
{
|
|
|
|
auto projection_columns = union_node_typed->computeProjectionColumns();
|
|
|
|
query_node_projection = NamesAndTypes(projection_columns.begin(), projection_columns.end());
|
|
|
|
}
|
|
|
|
|
|
|
|
projections.push_back(query_node_projection);
|
|
|
|
|
|
|
|
if (query_node_projection.size() != projections.front().size())
|
|
|
|
throw Exception(ErrorCodes::TYPE_MISMATCH, "UNION different number of columns in queries");
|
|
|
|
}
|
|
|
|
|
2022-08-31 15:21:17 +00:00
|
|
|
NamesAndTypes result_columns;
|
2022-08-23 09:50:02 +00:00
|
|
|
|
|
|
|
size_t projections_size = projections.size();
|
|
|
|
DataTypes projection_column_types;
|
|
|
|
projection_column_types.resize(projections_size);
|
|
|
|
|
|
|
|
size_t columns_size = query_node_projection.size();
|
|
|
|
for (size_t column_index = 0; column_index < columns_size; ++column_index)
|
|
|
|
{
|
|
|
|
for (size_t projection_index = 0; projection_index < projections_size; ++projection_index)
|
|
|
|
projection_column_types[projection_index] = projections[projection_index][column_index].type;
|
|
|
|
|
|
|
|
auto result_type = getLeastSupertype(projection_column_types);
|
|
|
|
result_columns.emplace_back(projections.front()[column_index].name, std::move(result_type));
|
|
|
|
}
|
|
|
|
|
|
|
|
return result_columns;
|
|
|
|
}
|
|
|
|
|
|
|
|
String UnionNode::getName() const
|
|
|
|
{
|
|
|
|
WriteBufferFromOwnString buffer;
|
|
|
|
|
|
|
|
auto query_nodes = getQueries().getNodes();
|
|
|
|
size_t query_nodes_size = query_nodes.size();
|
|
|
|
|
|
|
|
for (size_t i = 0; i < query_nodes_size; ++i)
|
|
|
|
{
|
|
|
|
const auto & query_node = query_nodes[i];
|
|
|
|
buffer << query_node->getName();
|
|
|
|
|
|
|
|
if (i == 0)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
auto query_union_mode = union_modes.at(i - 1);
|
2022-09-06 16:46:30 +00:00
|
|
|
|
|
|
|
if (query_union_mode == SelectUnionMode::UNION_DEFAULT)
|
|
|
|
buffer << "UNION";
|
|
|
|
else if (query_union_mode == SelectUnionMode::UNION_ALL)
|
|
|
|
buffer << "UNION ALL";
|
|
|
|
else if (query_union_mode == SelectUnionMode::UNION_DISTINCT)
|
|
|
|
buffer << "UNION DISTINCT";
|
|
|
|
else if (query_union_mode == SelectUnionMode::EXCEPT_DEFAULT)
|
|
|
|
buffer << "EXCEPT";
|
|
|
|
else if (query_union_mode == SelectUnionMode::EXCEPT_ALL)
|
|
|
|
buffer << "EXCEPT ALL";
|
|
|
|
else if (query_union_mode == SelectUnionMode::EXCEPT_DISTINCT)
|
|
|
|
buffer << "EXCEPT DISTINCT";
|
|
|
|
else if (query_union_mode == SelectUnionMode::INTERSECT_DEFAULT)
|
|
|
|
buffer << "INTERSECT";
|
|
|
|
else if (query_union_mode == SelectUnionMode::INTERSECT_ALL)
|
|
|
|
buffer << "INTERSECT ALL";
|
|
|
|
else if (query_union_mode == SelectUnionMode::INTERSECT_DISTINCT)
|
|
|
|
buffer << "INTERSECT DISTINCT";
|
2022-08-23 09:50:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return buffer.str();
|
|
|
|
}
|
|
|
|
|
|
|
|
void UnionNode::dumpTreeImpl(WriteBuffer & buffer, FormatState & format_state, size_t indent) const
|
|
|
|
{
|
|
|
|
buffer << std::string(indent, ' ') << "UNION id: " << format_state.getNodeId(this);
|
|
|
|
|
|
|
|
if (hasAlias())
|
|
|
|
buffer << ", alias: " << getAlias();
|
|
|
|
|
|
|
|
buffer << ", is_subquery: " << is_subquery;
|
|
|
|
buffer << ", is_cte: " << is_cte;
|
|
|
|
|
|
|
|
if (!cte_name.empty())
|
|
|
|
buffer << ", cte_name: " << cte_name;
|
|
|
|
|
2022-08-31 15:21:17 +00:00
|
|
|
if (constant_value)
|
|
|
|
{
|
|
|
|
buffer << ", constant_value: " << constant_value->getValue().dump();
|
|
|
|
buffer << ", constant_value_type: " << constant_value->getType()->getName();
|
|
|
|
}
|
|
|
|
|
2022-09-04 15:20:59 +00:00
|
|
|
if (table_expression_modifiers)
|
|
|
|
{
|
|
|
|
buffer << ", ";
|
|
|
|
table_expression_modifiers->dump(buffer);
|
|
|
|
}
|
|
|
|
|
2022-09-06 16:46:30 +00:00
|
|
|
buffer << ", union_mode: " << toString(union_mode);
|
2022-08-23 09:50:02 +00:00
|
|
|
|
|
|
|
size_t union_modes_size = union_modes.size();
|
|
|
|
buffer << '\n' << std::string(indent + 2, ' ') << "UNION MODES " << union_modes_size << '\n';
|
|
|
|
|
|
|
|
for (size_t i = 0; i < union_modes_size; ++i)
|
|
|
|
{
|
|
|
|
buffer << std::string(indent + 4, ' ');
|
|
|
|
|
|
|
|
auto query_union_mode = union_modes[i];
|
2022-09-06 16:46:30 +00:00
|
|
|
buffer << toString(query_union_mode);
|
2022-08-23 09:50:02 +00:00
|
|
|
|
|
|
|
if (i + 1 != union_modes_size)
|
|
|
|
buffer << '\n';
|
|
|
|
}
|
|
|
|
|
|
|
|
buffer << '\n' << std::string(indent + 2, ' ') << "QUERIES\n";
|
|
|
|
getQueriesNode()->dumpTreeImpl(buffer, format_state, indent + 4);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool UnionNode::isEqualImpl(const IQueryTreeNode & rhs) const
|
|
|
|
{
|
|
|
|
const auto & rhs_typed = assert_cast<const UnionNode &>(rhs);
|
2022-08-31 15:21:17 +00:00
|
|
|
if (constant_value && rhs_typed.constant_value && *constant_value != *rhs_typed.constant_value)
|
|
|
|
return false;
|
|
|
|
else if (constant_value && !rhs_typed.constant_value)
|
|
|
|
return false;
|
|
|
|
else if (!constant_value && rhs_typed.constant_value)
|
|
|
|
return false;
|
|
|
|
|
2022-09-04 15:20:59 +00:00
|
|
|
if (table_expression_modifiers && rhs_typed.table_expression_modifiers && table_expression_modifiers != rhs_typed.table_expression_modifiers)
|
|
|
|
return false;
|
|
|
|
else if (table_expression_modifiers && !rhs_typed.table_expression_modifiers)
|
|
|
|
return false;
|
|
|
|
else if (!table_expression_modifiers && rhs_typed.table_expression_modifiers)
|
|
|
|
return false;
|
|
|
|
|
2022-08-23 09:50:02 +00:00
|
|
|
return is_subquery == rhs_typed.is_subquery && is_cte == rhs_typed.is_cte && cte_name == rhs_typed.cte_name;
|
|
|
|
}
|
|
|
|
|
|
|
|
void UnionNode::updateTreeHashImpl(HashState & state) const
|
|
|
|
{
|
|
|
|
state.update(is_subquery);
|
|
|
|
state.update(is_cte);
|
|
|
|
|
|
|
|
state.update(cte_name.size());
|
|
|
|
state.update(cte_name);
|
2022-08-31 15:21:17 +00:00
|
|
|
|
|
|
|
if (constant_value)
|
|
|
|
{
|
|
|
|
auto constant_dump = applyVisitor(FieldVisitorToString(), constant_value->getValue());
|
|
|
|
state.update(constant_dump.size());
|
|
|
|
state.update(constant_dump);
|
|
|
|
|
|
|
|
auto constant_value_type_name = constant_value->getType()->getName();
|
|
|
|
state.update(constant_value_type_name.size());
|
|
|
|
state.update(constant_value_type_name);
|
|
|
|
}
|
2022-09-04 15:20:59 +00:00
|
|
|
|
|
|
|
if (table_expression_modifiers)
|
|
|
|
table_expression_modifiers->updateTreeHash(state);
|
2022-08-23 09:50:02 +00:00
|
|
|
}
|
|
|
|
|
2022-10-10 10:25:58 +00:00
|
|
|
QueryTreeNodePtr UnionNode::cloneImpl() const
|
|
|
|
{
|
|
|
|
auto result_query_node = std::make_shared<UnionNode>();
|
|
|
|
|
|
|
|
result_query_node->is_subquery = is_subquery;
|
|
|
|
result_query_node->is_cte = is_cte;
|
|
|
|
result_query_node->cte_name = cte_name;
|
|
|
|
result_query_node->union_mode = union_mode;
|
|
|
|
result_query_node->union_modes = union_modes;
|
|
|
|
result_query_node->union_modes_set = union_modes_set;
|
|
|
|
result_query_node->constant_value = constant_value;
|
|
|
|
result_query_node->table_expression_modifiers = table_expression_modifiers;
|
|
|
|
|
|
|
|
return result_query_node;
|
|
|
|
}
|
|
|
|
|
2022-08-23 09:50:02 +00:00
|
|
|
ASTPtr UnionNode::toASTImpl() const
|
|
|
|
{
|
|
|
|
auto select_with_union_query = std::make_shared<ASTSelectWithUnionQuery>();
|
|
|
|
select_with_union_query->union_mode = union_mode;
|
2022-09-06 16:46:30 +00:00
|
|
|
|
|
|
|
if (union_mode != SelectUnionMode::UNION_DEFAULT &&
|
|
|
|
union_mode != SelectUnionMode::EXCEPT_DEFAULT &&
|
2022-10-17 17:46:30 +00:00
|
|
|
union_mode != SelectUnionMode::INTERSECT_DEFAULT)
|
2022-09-06 16:46:30 +00:00
|
|
|
select_with_union_query->is_normalized = true;
|
|
|
|
|
2022-08-23 09:50:02 +00:00
|
|
|
select_with_union_query->list_of_modes = union_modes;
|
|
|
|
select_with_union_query->set_of_modes = union_modes_set;
|
|
|
|
select_with_union_query->children.push_back(getQueriesNode()->toAST());
|
|
|
|
select_with_union_query->list_of_selects = select_with_union_query->children.back();
|
|
|
|
|
|
|
|
return select_with_union_query;
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|