#include #include #include #include #include #include #include #include #include #include #include #include #include #include namespace DB { namespace ErrorCodes { extern const int UNKNOWN_IDENTIFIER; extern const int UNKNOWN_ELEMENT_IN_AST; extern const int LOGICAL_ERROR; } bool TranslateQualifiedNamesMatcher::needChildVisit(ASTPtr & node, const ASTPtr & child) { /// Do not go to FROM, JOIN, subqueries. if (typeid_cast(child.get()) || typeid_cast(child.get())) return false; /// Processed nodes. Do not go into children. if (typeid_cast(node.get()) || typeid_cast(node.get())) return false; /// ASTSelectQuery + others return true; } std::vector TranslateQualifiedNamesMatcher::visit(ASTPtr & ast, Data & data) { if (auto * t = typeid_cast(ast.get())) return visit(*t, ast, data); if (auto * t = typeid_cast(ast.get())) return visit(*t, ast, data); if (auto * t = typeid_cast(ast.get())) return visit(*t, ast, data); if (auto * node = typeid_cast(ast.get())) visit(*node, ast, data); if (auto * node = typeid_cast(ast.get())) visit(*node, ast, data); return {}; } std::vector TranslateQualifiedNamesMatcher::visit(ASTIdentifier & identifier, ASTPtr &, Data & data) { if (IdentifierSemantic::getColumnName(identifier)) { size_t best_table_pos = 0; size_t best_match = 0; for (size_t i = 0; i < data.tables.size(); ++i) if (size_t match = IdentifierSemantic::canReferColumnToTable(identifier, data.tables[i].first)) if (match > best_match) { best_match = match; best_table_pos = i; } if (best_match) IdentifierSemantic::setMembership(identifier, best_table_pos + 1); /// In case if column from the joined table are in source columns, change it's name to qualified. if (best_table_pos && data.source_columns.count(identifier.shortName())) IdentifierSemantic::setNeedLongName(identifier, true); if (!data.tables.empty()) IdentifierSemantic::setColumnNormalName(identifier, data.tables[best_table_pos].first); } return {}; } /// As special case, treat count(*) as count(), not as count(list of all columns). void TranslateQualifiedNamesMatcher::visit(ASTFunction & node, const ASTPtr &, Data &) { ASTPtr & func_arguments = node.arguments; String func_name_lowercase = Poco::toLower(node.name); if (func_name_lowercase == "count" && func_arguments->children.size() == 1 && typeid_cast(func_arguments->children[0].get())) func_arguments->children.clear(); } std::vector TranslateQualifiedNamesMatcher::visit(const ASTQualifiedAsterisk & , const ASTPtr & ast, Data & data) { if (ast->children.size() != 1) throw Exception("Logical error: qualified asterisk must have exactly one child", ErrorCodes::LOGICAL_ERROR); auto & ident = ast->children[0]; /// @note it could contain table alias as table name. DatabaseAndTableWithAlias db_and_table(ident); for (const auto & known_table : data.tables) if (db_and_table.satisfies(known_table.first, true)) return {}; throw Exception("Unknown qualified identifier: " + ident->getAliasOrColumnName(), ErrorCodes::UNKNOWN_IDENTIFIER); } std::vector TranslateQualifiedNamesMatcher::visit(ASTTableJoin & join, const ASTPtr & , Data &) { std::vector out; if (join.using_expression_list) out.push_back(&join.using_expression_list); else if (join.on_expression) out.push_back(&join.on_expression); return out; } std::vector TranslateQualifiedNamesMatcher::visit(ASTSelectQuery & select, const ASTPtr & , Data & data) { if (auto join = select.join()) extractJoinUsingColumns(join->table_join, data); /// If the WHERE clause or HAVING consists of a single qualified column, the reference must be translated not only in children, /// but also in where_expression and having_expression. std::vector out; if (select.prewhere_expression) out.push_back(&select.prewhere_expression); if (select.where_expression) out.push_back(&select.where_expression); if (select.having_expression) out.push_back(&select.having_expression); return out; } /// Replace *, alias.*, database.table.* with a list of columns. void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPtr &, Data & data) { const auto & tables_with_columns = data.tables; const auto & source_columns = data.source_columns; ASTs old_children; if (data.processAsterisks()) { bool has_asterisk = false; for (const auto & child : node.children) { if (typeid_cast(child.get())) { if (tables_with_columns.empty()) throw Exception("An asterisk cannot be replaced with empty columns.", ErrorCodes::LOGICAL_ERROR); has_asterisk = true; break; } else if (auto qa = typeid_cast(child.get())) { visit(*qa, child, data); /// check if it's OK before rewrite has_asterisk = true; break; } } if (has_asterisk) { old_children.swap(node.children); node.children.reserve(old_children.size()); } } for (const auto & child : old_children) { if (typeid_cast(child.get())) { bool first_table = true; for (const auto & [table_name, table_columns] : tables_with_columns) { for (const auto & column_name : table_columns) if (first_table || !data.join_using_columns.count(column_name)) { /// qualifed names for duplicates if (!first_table && source_columns.count(column_name)) node.children.emplace_back(std::make_shared(table_name.getQualifiedNamePrefix() + column_name)); else node.children.emplace_back(std::make_shared(column_name)); } first_table = false; } } else if (const auto * qualified_asterisk = typeid_cast(child.get())) { DatabaseAndTableWithAlias ident_db_and_name(qualified_asterisk->children[0]); bool first_table = true; for (const auto & [table_name, table_columns] : tables_with_columns) { if (ident_db_and_name.satisfies(table_name, true)) { for (const auto & column_name : table_columns) { /// qualifed names for duplicates if (!first_table && source_columns.count(column_name)) node.children.emplace_back(std::make_shared(table_name.getQualifiedNamePrefix() + column_name)); else node.children.emplace_back(std::make_shared(column_name)); } break; } first_table = false; } } else node.children.emplace_back(child); } } /// 'select * from a join b using id' should result one 'id' column void TranslateQualifiedNamesMatcher::extractJoinUsingColumns(const ASTPtr ast, Data & data) { const auto & table_join = typeid_cast(*ast); if (table_join.using_expression_list) { auto & keys = typeid_cast(*table_join.using_expression_list); for (const auto & key : keys.children) if (auto opt_column = getIdentifierName(key)) data.join_using_columns.insert(*opt_column); else if (typeid_cast(key.get())) data.join_using_columns.insert(key->getColumnName()); else { String alias = key->tryGetAlias(); if (alias.empty()) throw Exception("Logical error: expected identifier or alias, got: " + key->getID(), ErrorCodes::LOGICAL_ERROR); data.join_using_columns.insert(alias); } } } }