2019-01-25 15:42:24 +00:00
|
|
|
#include <Common/typeid_cast.h>
|
|
|
|
|
|
|
|
#include <Interpreters/IdentifierSemantic.h>
|
2020-03-13 10:30:55 +00:00
|
|
|
#include <Interpreters/StorageID.h>
|
2019-01-25 15:42:24 +00:00
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2019-10-17 21:08:28 +00:00
|
|
|
namespace ErrorCodes
|
|
|
|
{
|
2020-02-25 18:02:41 +00:00
|
|
|
extern const int LOGICAL_ERROR;
|
2019-10-17 21:08:28 +00:00
|
|
|
extern const int AMBIGUOUS_COLUMN_NAME;
|
|
|
|
}
|
|
|
|
|
2019-10-16 17:33:53 +00:00
|
|
|
namespace
|
|
|
|
{
|
|
|
|
|
|
|
|
template <typename T>
|
2020-03-08 11:07:05 +00:00
|
|
|
std::optional<size_t> tryChooseTable(const ASTIdentifier & identifier, const std::vector<T> & tables, bool allow_ambiguous)
|
2019-10-16 17:33:53 +00:00
|
|
|
{
|
2019-10-17 21:08:28 +00:00
|
|
|
using ColumnMatch = IdentifierSemantic::ColumnMatch;
|
|
|
|
|
2020-03-08 11:07:05 +00:00
|
|
|
size_t best_table_pos = 0;
|
2019-10-17 21:08:28 +00:00
|
|
|
auto best_match = ColumnMatch::NoMatch;
|
|
|
|
size_t same_match = 0;
|
|
|
|
|
2019-10-16 17:33:53 +00:00
|
|
|
for (size_t i = 0; i < tables.size(); ++i)
|
2019-10-17 21:08:28 +00:00
|
|
|
{
|
2020-03-08 11:07:05 +00:00
|
|
|
auto match = IdentifierSemantic::canReferColumnToTable(identifier, tables[i]);
|
2019-10-24 13:04:50 +00:00
|
|
|
if (match != ColumnMatch::NoMatch)
|
2019-10-17 21:08:28 +00:00
|
|
|
{
|
2019-10-24 13:04:50 +00:00
|
|
|
if (match > best_match)
|
2019-10-16 17:33:53 +00:00
|
|
|
{
|
|
|
|
best_match = match;
|
|
|
|
best_table_pos = i;
|
2019-10-17 21:08:28 +00:00
|
|
|
same_match = 0;
|
2019-10-16 17:33:53 +00:00
|
|
|
}
|
2019-10-17 21:08:28 +00:00
|
|
|
else if (match == best_match)
|
|
|
|
++same_match;
|
|
|
|
}
|
|
|
|
}
|
2019-10-16 17:33:53 +00:00
|
|
|
|
2019-10-24 13:04:50 +00:00
|
|
|
if ((best_match != ColumnMatch::NoMatch) && same_match)
|
2019-10-17 21:08:28 +00:00
|
|
|
{
|
|
|
|
if (!allow_ambiguous)
|
|
|
|
throw Exception("Ambiguous column '" + identifier.name + "'", ErrorCodes::AMBIGUOUS_COLUMN_NAME);
|
2020-03-08 11:07:05 +00:00
|
|
|
best_match = ColumnMatch::Ambiguous;
|
|
|
|
return {};
|
2019-10-17 21:08:28 +00:00
|
|
|
}
|
2020-03-08 11:07:05 +00:00
|
|
|
|
|
|
|
if (best_match != ColumnMatch::NoMatch)
|
|
|
|
return best_table_pos;
|
|
|
|
return {};
|
2019-10-16 17:33:53 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2019-01-25 15:42:24 +00:00
|
|
|
std::optional<String> IdentifierSemantic::getColumnName(const ASTIdentifier & node)
|
|
|
|
{
|
|
|
|
if (!node.semantic->special)
|
|
|
|
return node.name;
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
std::optional<String> IdentifierSemantic::getColumnName(const ASTPtr & ast)
|
|
|
|
{
|
|
|
|
if (ast)
|
2019-03-11 13:22:51 +00:00
|
|
|
if (const auto * id = ast->as<ASTIdentifier>())
|
2019-01-25 15:42:24 +00:00
|
|
|
if (!id->semantic->special)
|
|
|
|
return id->name;
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
std::optional<String> IdentifierSemantic::getTableName(const ASTIdentifier & node)
|
|
|
|
{
|
|
|
|
if (node.semantic->special)
|
|
|
|
return node.name;
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
std::optional<String> IdentifierSemantic::getTableName(const ASTPtr & ast)
|
|
|
|
{
|
|
|
|
if (ast)
|
2019-03-11 13:22:51 +00:00
|
|
|
if (const auto * id = ast->as<ASTIdentifier>())
|
2019-01-25 15:42:24 +00:00
|
|
|
if (id->semantic->special)
|
|
|
|
return id->name;
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
2019-12-24 18:51:37 +00:00
|
|
|
std::optional<ASTIdentifier> IdentifierSemantic::uncover(const ASTIdentifier & identifier)
|
|
|
|
{
|
|
|
|
if (identifier.semantic->covered)
|
|
|
|
{
|
|
|
|
std::vector<String> name_parts = identifier.name_parts;
|
|
|
|
return ASTIdentifier(std::move(name_parts));
|
|
|
|
}
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
void IdentifierSemantic::coverName(ASTIdentifier & identifier, const String & alias)
|
|
|
|
{
|
|
|
|
identifier.setShortName(alias);
|
|
|
|
identifier.semantic->covered = true;
|
|
|
|
}
|
|
|
|
|
2019-02-11 19:14:57 +00:00
|
|
|
bool IdentifierSemantic::canBeAlias(const ASTIdentifier & identifier)
|
|
|
|
{
|
|
|
|
return identifier.semantic->can_be_alias;
|
|
|
|
}
|
|
|
|
|
2019-10-18 16:16:57 +00:00
|
|
|
void IdentifierSemantic::setMembership(ASTIdentifier & identifier, size_t table_pos)
|
2019-02-13 15:18:02 +00:00
|
|
|
{
|
2019-10-18 16:16:57 +00:00
|
|
|
identifier.semantic->membership = table_pos;
|
|
|
|
identifier.semantic->can_be_alias = false;
|
2019-02-13 15:18:02 +00:00
|
|
|
}
|
|
|
|
|
2019-10-18 16:16:57 +00:00
|
|
|
std::optional<size_t> IdentifierSemantic::getMembership(const ASTIdentifier & identifier)
|
2019-02-13 15:18:02 +00:00
|
|
|
{
|
|
|
|
return identifier.semantic->membership;
|
|
|
|
}
|
2019-02-11 19:14:57 +00:00
|
|
|
|
2020-03-08 11:07:05 +00:00
|
|
|
std::optional<size_t> IdentifierSemantic::chooseTable(const ASTIdentifier & identifier, const std::vector<DatabaseAndTableWithAlias> & tables,
|
|
|
|
bool ambiguous)
|
2019-10-16 14:47:58 +00:00
|
|
|
{
|
2020-03-08 11:07:05 +00:00
|
|
|
return tryChooseTable<DatabaseAndTableWithAlias>(identifier, tables, ambiguous);
|
2019-10-16 17:33:53 +00:00
|
|
|
}
|
2019-10-16 14:47:58 +00:00
|
|
|
|
2020-03-08 11:07:05 +00:00
|
|
|
std::optional<size_t> IdentifierSemantic::chooseTable(const ASTIdentifier & identifier, const std::vector<TableWithColumnNames> & tables,
|
|
|
|
bool ambiguous)
|
2019-10-16 17:33:53 +00:00
|
|
|
{
|
2020-03-08 11:07:05 +00:00
|
|
|
return tryChooseTable<TableWithColumnNames>(identifier, tables, ambiguous);
|
|
|
|
}
|
|
|
|
|
|
|
|
std::optional<size_t> IdentifierSemantic::chooseTable(const ASTIdentifier & identifier, const std::vector<TableWithColumnNamesAndTypes> & tables,
|
|
|
|
bool ambiguous)
|
|
|
|
{
|
|
|
|
return tryChooseTable<TableWithColumnNamesAndTypes>(identifier, tables, ambiguous);
|
2019-10-16 14:47:58 +00:00
|
|
|
}
|
|
|
|
|
2020-03-12 18:04:29 +00:00
|
|
|
StorageID IdentifierSemantic::extractDatabaseAndTable(const ASTIdentifier & identifier)
|
2019-01-25 15:42:24 +00:00
|
|
|
{
|
|
|
|
if (identifier.name_parts.size() > 2)
|
|
|
|
throw Exception("Logical error: more than two components in table expression", ErrorCodes::LOGICAL_ERROR);
|
|
|
|
|
|
|
|
if (identifier.name_parts.size() == 2)
|
2020-03-12 18:04:29 +00:00
|
|
|
return { identifier.name_parts[0], identifier.name_parts[1], identifier.uuid };
|
|
|
|
return { "", identifier.name, identifier.uuid };
|
2019-01-25 15:42:24 +00:00
|
|
|
}
|
|
|
|
|
2019-11-13 16:49:29 +00:00
|
|
|
std::optional<String> IdentifierSemantic::extractNestedName(const ASTIdentifier & identifier, const String & table_name)
|
|
|
|
{
|
|
|
|
if (identifier.name_parts.size() == 3 && table_name == identifier.name_parts[0])
|
|
|
|
return identifier.name_parts[1] + '.' + identifier.name_parts[2];
|
|
|
|
else if (identifier.name_parts.size() == 2)
|
|
|
|
return identifier.name_parts[0] + '.' + identifier.name_parts[1];
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
2019-01-25 15:42:24 +00:00
|
|
|
bool IdentifierSemantic::doesIdentifierBelongTo(const ASTIdentifier & identifier, const String & database, const String & table)
|
|
|
|
{
|
|
|
|
size_t num_components = identifier.name_parts.size();
|
|
|
|
if (num_components >= 3)
|
|
|
|
return identifier.name_parts[0] == database &&
|
|
|
|
identifier.name_parts[1] == table;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool IdentifierSemantic::doesIdentifierBelongTo(const ASTIdentifier & identifier, const String & table)
|
|
|
|
{
|
|
|
|
size_t num_components = identifier.name_parts.size();
|
|
|
|
if (num_components >= 2)
|
|
|
|
return identifier.name_parts[0] == table;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2019-10-17 21:08:28 +00:00
|
|
|
IdentifierSemantic::ColumnMatch IdentifierSemantic::canReferColumnToTable(const ASTIdentifier & identifier,
|
|
|
|
const DatabaseAndTableWithAlias & db_and_table)
|
2019-01-25 15:42:24 +00:00
|
|
|
{
|
|
|
|
/// database.table.column
|
|
|
|
if (doesIdentifierBelongTo(identifier, db_and_table.database, db_and_table.table))
|
2019-10-18 16:16:57 +00:00
|
|
|
return ColumnMatch::DbAndTable;
|
2019-01-25 15:42:24 +00:00
|
|
|
|
2019-10-17 21:08:28 +00:00
|
|
|
/// alias.column
|
|
|
|
if (doesIdentifierBelongTo(identifier, db_and_table.alias))
|
|
|
|
return ColumnMatch::TableAlias;
|
2019-01-25 15:42:24 +00:00
|
|
|
|
2019-10-17 21:08:28 +00:00
|
|
|
/// table.column
|
|
|
|
if (doesIdentifierBelongTo(identifier, db_and_table.table))
|
2019-01-25 15:42:24 +00:00
|
|
|
{
|
2019-10-18 16:16:57 +00:00
|
|
|
if (!db_and_table.alias.empty())
|
|
|
|
return ColumnMatch::AliasedTableName;
|
|
|
|
else
|
|
|
|
return ColumnMatch::TableName;
|
2019-01-25 15:42:24 +00:00
|
|
|
}
|
2019-10-18 16:16:57 +00:00
|
|
|
|
|
|
|
return ColumnMatch::NoMatch;
|
2019-01-25 15:42:24 +00:00
|
|
|
}
|
|
|
|
|
2020-03-08 11:07:05 +00:00
|
|
|
IdentifierSemantic::ColumnMatch IdentifierSemantic::canReferColumnToTable(const ASTIdentifier & identifier,
|
|
|
|
const TableWithColumnNames & db_and_table)
|
|
|
|
{
|
|
|
|
/// TODO: ColumnName match logic is disabled cause caller's code is not ready for it
|
|
|
|
return canReferColumnToTable(identifier, db_and_table.table);
|
|
|
|
}
|
|
|
|
|
|
|
|
IdentifierSemantic::ColumnMatch IdentifierSemantic::canReferColumnToTable(const ASTIdentifier & identifier,
|
|
|
|
const TableWithColumnNamesAndTypes & db_and_table)
|
|
|
|
{
|
|
|
|
ColumnMatch match = canReferColumnToTable(identifier, db_and_table.table);
|
|
|
|
if (match == ColumnMatch::NoMatch && identifier.isShort() && db_and_table.hasColumn(identifier.shortName()))
|
|
|
|
match = ColumnMatch::ColumnName;
|
|
|
|
return match;
|
|
|
|
}
|
|
|
|
|
2019-10-18 16:16:57 +00:00
|
|
|
/// Strip qualificators from left side of column name.
|
|
|
|
/// Example: 'database.table.name' -> 'name'.
|
|
|
|
void IdentifierSemantic::setColumnShortName(ASTIdentifier & identifier, const DatabaseAndTableWithAlias & db_and_table)
|
2019-01-25 15:42:24 +00:00
|
|
|
{
|
2019-10-17 21:08:28 +00:00
|
|
|
auto match = IdentifierSemantic::canReferColumnToTable(identifier, db_and_table);
|
|
|
|
size_t to_strip = 0;
|
|
|
|
switch (match)
|
|
|
|
{
|
|
|
|
case ColumnMatch::TableName:
|
2019-10-18 16:16:57 +00:00
|
|
|
case ColumnMatch::AliasedTableName:
|
2019-10-17 21:08:28 +00:00
|
|
|
case ColumnMatch::TableAlias:
|
|
|
|
to_strip = 1;
|
|
|
|
break;
|
2019-10-18 16:16:57 +00:00
|
|
|
case ColumnMatch::DbAndTable:
|
2019-10-17 21:08:28 +00:00
|
|
|
to_strip = 2;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
2019-02-07 19:18:40 +00:00
|
|
|
|
2019-10-18 16:16:57 +00:00
|
|
|
if (!to_strip)
|
|
|
|
return;
|
|
|
|
|
|
|
|
std::vector<String> stripped(identifier.name_parts.begin() + to_strip, identifier.name_parts.end());
|
2019-02-07 19:18:40 +00:00
|
|
|
|
2019-10-18 16:16:57 +00:00
|
|
|
DB::String new_name;
|
|
|
|
for (const auto & part : stripped)
|
|
|
|
{
|
|
|
|
if (!new_name.empty())
|
|
|
|
new_name += '.';
|
|
|
|
new_name += part;
|
|
|
|
}
|
|
|
|
identifier.name.swap(new_name);
|
2019-02-20 12:12:36 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void IdentifierSemantic::setColumnLongName(ASTIdentifier & identifier, const DatabaseAndTableWithAlias & db_and_table)
|
|
|
|
{
|
|
|
|
String prefix = db_and_table.getQualifiedNamePrefix();
|
|
|
|
if (!prefix.empty())
|
2019-02-07 19:18:40 +00:00
|
|
|
{
|
2019-02-20 12:12:36 +00:00
|
|
|
String short_name = identifier.shortName();
|
|
|
|
identifier.name = prefix + short_name;
|
|
|
|
prefix.resize(prefix.size() - 1); /// crop dot
|
|
|
|
identifier.name_parts = {prefix, short_name};
|
2019-02-07 19:18:40 +00:00
|
|
|
}
|
2019-01-25 15:42:24 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
}
|