ClickHouse/src/Parsers/ASTSelectQuery.cpp

521 lines
17 KiB
C++

#include <Common/typeid_cast.h>
#include <Parsers/ASTSetQuery.h>
#include <Parsers/ASTFunction.h>
#include <Parsers/ASTIdentifier.h>
#include <Parsers/ASTSelectQuery.h>
#include <Parsers/ASTOrderByElement.h>
#include <Parsers/ASTTablesInSelectQuery.h>
#include <Interpreters/StorageID.h>
#include <IO/Operators.h>
#include <Parsers/ASTLiteral.h>
#include <Common/FieldVisitorToString.h>
#include <Interpreters/QueryParameterVisitor.h>
#include <queue>
namespace DB
{
/// Error codes used by the exceptions thrown in this file.
/// They are only declared here (`extern`); the definitions live elsewhere.
namespace ErrorCodes
{
extern const int NOT_IMPLEMENTED;
extern const int LOGICAL_ERROR;
}
ASTPtr ASTSelectQuery::clone() const
{
    /// Start from a member-wise copy, then replace the (shared) children with clones of their own.
    auto cloned = std::make_shared<ASTSelectQuery>(*this);

    /** NOTE The children are cloned strictly in the order they already have in `children`,
      * i.e. the order in which ParserSelectQuery inserted them.
      *
      * The AST hash depends on the order of children, and that hash is used in several places:
      * for column identifiers of subqueries inside IN, and for caching scalar queries
      * (which are reused in CTEs, so equal queries must produce equal hashes).
      *
      * It also matters for distributed queries: when one of the servers is localhost, the query
      * is cloned and executed in-process, while remote servers receive the query as text over TCP.
      * If the clone order differed from the parse order, the servers would end up with
      * different identifiers.
      *
      * The positions map stores <key, position> pairs, so it has been copied as is above;
      * it stays valid because the new children array is filled in the same order.
      */
    cloned->children.clear();
    for (const auto & original_child : children)
        cloned->children.push_back(original_child->clone());

    return cloned;
}
/// Feeds the SELECT-specific flags into the hash state and then delegates to IAST::updateTreeHashImpl.
/// The order of the update() calls below is part of the resulting hash value.
/// NOTE(review): `group_by_with_grouping_sets` (which formatImpl does take into account) is not hashed here —
/// confirm whether that is intentional before relying on the hash to distinguish such queries.
void ASTSelectQuery::updateTreeHashImpl(SipHash & hash_state) const
{
hash_state.update(distinct);
hash_state.update(group_by_with_totals);
hash_state.update(group_by_with_rollup);
hash_state.update(group_by_with_cube);
hash_state.update(limit_with_ties);
IAST::updateTreeHashImpl(hash_state);
}
/// Writes the textual form of the SELECT query to `s.ostr`, clause by clause, in this order:
/// WITH, SELECT, FROM, PREWHERE, WHERE, GROUP BY (plus WITH ROLLUP / WITH CUBE / GROUPING SETS / WITH TOTALS),
/// HAVING, WINDOW, ORDER BY (plus INTERPOLATE), LIMIT ... BY, LIMIT / OFFSET, SETTINGS.
/// A clause is printed only when the corresponding expression or flag is set.
/// `frame` is taken by value, so the adjustments made below do not leak to the caller.
void ASTSelectQuery::formatImpl(const FormatSettings & s, FormatState & state, FormatStateStacked frame) const
{
frame.current_select = this;
frame.need_parens = false;
frame.expression_list_prepend_whitespace = true;
/// Keywords are indented by 4 spaces per indent level, unless everything goes on one line.
std::string indent_str = s.one_line ? "" : std::string(4 * frame.indent, ' ');
if (with())
{
s.ostr << (s.hilite ? hilite_keyword : "") << indent_str << "WITH" << (s.hilite ? hilite_none : "");
/// Expression lists are formatted either inline or one element per line, depending on `s.one_line`.
s.one_line
? with()->formatImpl(s, state, frame)
: with()->as<ASTExpressionList &>().formatImplMultiline(s, state, frame);
s.ostr << s.nl_or_ws;
}
/// The SELECT list is formatted unconditionally: select() is dereferenced without a null check.
s.ostr << (s.hilite ? hilite_keyword : "") << indent_str << "SELECT" << (distinct ? " DISTINCT" : "") << (s.hilite ? hilite_none : "");
s.one_line
? select()->formatImpl(s, state, frame)
: select()->as<ASTExpressionList &>().formatImplMultiline(s, state, frame);
if (tables())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "FROM" << (s.hilite ? hilite_none : "");
tables()->formatImpl(s, state, frame);
}
if (prewhere())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "PREWHERE " << (s.hilite ? hilite_none : "");
prewhere()->formatImpl(s, state, frame);
}
if (where())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "WHERE " << (s.hilite ? hilite_none : "");
where()->formatImpl(s, state, frame);
}
if (groupBy())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "GROUP BY" << (s.hilite ? hilite_none : "");
/// With GROUPING SETS the list is not printed here; it is printed inside the GROUPING SETS (...) block below.
if (!group_by_with_grouping_sets)
{
s.one_line
? groupBy()->formatImpl(s, state, frame)
: groupBy()->as<ASTExpressionList &>().formatImplMultiline(s, state, frame);
}
}
/// The GROUP BY modifiers depend only on their flags, not on groupBy() being set.
if (group_by_with_rollup)
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << (s.one_line ? "" : " ") << "WITH ROLLUP" << (s.hilite ? hilite_none : "");
if (group_by_with_cube)
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << (s.one_line ? "" : " ") << "WITH CUBE" << (s.hilite ? hilite_none : "");
if (group_by_with_grouping_sets)
{
/// A separate frame copy: each list element is wrapped in parentheses and nested one level deeper.
/// Note that groupBy() is dereferenced here without a null check.
auto nested_frame = frame;
nested_frame.surround_each_list_element_with_parens = true;
nested_frame.expression_list_prepend_whitespace = false;
nested_frame.indent++;
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << (s.one_line ? "" : " ") << "GROUPING SETS" << (s.hilite ? hilite_none : "");
s.ostr << " (";
s.one_line
? groupBy()->formatImpl(s, state, nested_frame)
: groupBy()->as<ASTExpressionList &>().formatImplMultiline(s, state, nested_frame);
s.ostr << ")";
}
if (group_by_with_totals)
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << (s.one_line ? "" : " ") << "WITH TOTALS" << (s.hilite ? hilite_none : "");
if (having())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "HAVING " << (s.hilite ? hilite_none : "");
having()->formatImpl(s, state, frame);
}
if (window())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str <<
"WINDOW" << (s.hilite ? hilite_none : "");
/// Unlike the other lists, the WINDOW list always goes through formatImplMultiline, regardless of `s.one_line`.
window()->as<ASTExpressionList &>().formatImplMultiline(s, state, frame);
}
if (orderBy())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "ORDER BY" << (s.hilite ? hilite_none : "");
s.one_line
? orderBy()->formatImpl(s, state, frame)
: orderBy()->as<ASTExpressionList &>().formatImplMultiline(s, state, frame);
/// INTERPOLATE is printed only as part of ORDER BY; its parenthesized list is omitted when it has no children.
if (interpolate())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "INTERPOLATE" << (s.hilite ? hilite_none : "");
if (!interpolate()->children.empty())
{
s.ostr << " (";
interpolate()->formatImpl(s, state, frame);
s.ostr << " )";
}
}
}
/// LIMIT [offset, ] length BY expressions. The clause is keyed on limitByLength();
/// limitBy() is dereferenced without a null check.
if (limitByLength())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "LIMIT " << (s.hilite ? hilite_none : "");
if (limitByOffset())
{
limitByOffset()->formatImpl(s, state, frame);
s.ostr << ", ";
}
limitByLength()->formatImpl(s, state, frame);
s.ostr << (s.hilite ? hilite_keyword : "") << " BY" << (s.hilite ? hilite_none : "");
s.one_line
? limitBy()->formatImpl(s, state, frame)
: limitBy()->as<ASTExpressionList &>().formatImplMultiline(s, state, frame);
}
/// LIMIT [offset, ] length [WITH TIES]; a standalone OFFSET is printed only when there is no limit length.
if (limitLength())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "LIMIT " << (s.hilite ? hilite_none : "");
if (limitOffset())
{
limitOffset()->formatImpl(s, state, frame);
s.ostr << ", ";
}
limitLength()->formatImpl(s, state, frame);
if (limit_with_ties)
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << " WITH TIES" << (s.hilite ? hilite_none : "");
}
else if (limitOffset())
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "OFFSET " << (s.hilite ? hilite_none : "");
limitOffset()->formatImpl(s, state, frame);
}
/// SETTINGS is printed only when the ASTSetQuery node has its `print_in_format` flag set.
if (settings() && assert_cast<ASTSetQuery *>(settings().get())->print_in_format)
{
s.ostr << (s.hilite ? hilite_keyword : "") << s.nl_or_ws << indent_str << "SETTINGS " << (s.hilite ? hilite_none : "");
settings()->formatImpl(s, state, frame);
}
}
/// Compatibility functions. TODO Remove.
/// Returns the table expression of the first element of the tables list (read-only view),
/// or nullptr when the query has no tables list, the list is empty, or the first element
/// carries no table expression.
static const ASTTableExpression * getFirstTableExpression(const ASTSelectQuery & select)
{
    const auto tables_ast = select.tables();
    if (!tables_ast)
        return nullptr;

    const auto & elements = tables_ast->as<ASTTablesInSelectQuery &>().children;
    if (elements.empty())
        return nullptr;

    const auto & first_expression_ast = elements[0]->as<ASTTablesInSelectQueryElement &>().table_expression;
    return first_expression_ast ? first_expression_ast->as<ASTTableExpression>() : nullptr;
}
/// Mutable counterpart of the const overload: returns the table expression of the first element
/// of the tables list, or nullptr when there is no tables list, it is empty, or the first element
/// carries no table expression.
static ASTTableExpression * getFirstTableExpression(ASTSelectQuery & select)
{
    const auto tables_ast = select.tables();
    if (!tables_ast)
        return nullptr;

    auto & table_list = tables_ast->as<ASTTablesInSelectQuery &>();
    if (table_list.children.empty())
        return nullptr;

    auto & first_element = table_list.children[0]->as<ASTTablesInSelectQueryElement &>();
    if (first_element.table_expression)
        return first_element.table_expression->as<ASTTableExpression>();

    return nullptr;
}
/// Scans every element of the tables list and returns its ARRAY JOIN, or nullptr if there is none.
/// Throws NOT_IMPLEMENTED when a second ARRAY JOIN is encountered after one has already been found.
static const ASTArrayJoin * getFirstArrayJoin(const ASTSelectQuery & select)
{
    const auto tables_ast = select.tables();
    if (!tables_ast)
        return nullptr;

    const ASTArrayJoin * found = nullptr;
    for (const auto & element_ast : tables_ast->as<ASTTablesInSelectQuery &>().children)
    {
        const auto & element = element_ast->as<ASTTablesInSelectQueryElement &>();
        if (!element.array_join)
            continue;

        if (found)
            throw Exception("Support for more than one ARRAY JOIN in query is not implemented", ErrorCodes::NOT_IMPLEMENTED);

        found = element.array_join->as<ASTArrayJoin>();
    }

    return found;
}
/// Scans every element of the tables list and returns the one that has `table_join` set,
/// or nullptr if there is none. Throws NOT_IMPLEMENTED when more than one element has it.
static const ASTTablesInSelectQueryElement * getFirstTableJoin(const ASTSelectQuery & select)
{
    const auto tables_ast = select.tables();
    if (!tables_ast)
        return nullptr;

    const ASTTablesInSelectQueryElement * found = nullptr;
    for (const auto & element_ast : tables_ast->as<ASTTablesInSelectQuery &>().children)
    {
        const auto & element = element_ast->as<ASTTablesInSelectQueryElement &>();
        if (!element.table_join)
            continue;

        if (found)
            throw Exception("Multiple JOIN does not support the query.", ErrorCodes::NOT_IMPLEMENTED);

        found = &element;
    }

    return found;
}
/// `sample_size` of the first table expression; a null ASTPtr when the query has no first table expression.
ASTPtr ASTSelectQuery::sampleSize() const
{
    if (const ASTTableExpression * first_table = getFirstTableExpression(*this))
        return first_table->sample_size;

    return {};
}
/// `sample_offset` of the first table expression; a null ASTPtr when the query has no first table expression.
ASTPtr ASTSelectQuery::sampleOffset() const
{
    if (const ASTTableExpression * first_table = getFirstTableExpression(*this))
        return first_table->sample_offset;

    return {};
}
bool ASTSelectQuery::final() const
{
const ASTTableExpression * table_expression = getFirstTableExpression(*this);
if (!table_expression)
return {};
return table_expression->final;
}
bool ASTSelectQuery::withFill() const
{
const ASTPtr order_by = orderBy();
if (!order_by)
return false;
for (const auto & order_expression_element : order_by->children)
if (order_expression_element->as<ASTOrderByElement &>().with_fill)
return true;
return false;
}
std::pair<ASTPtr, bool> ASTSelectQuery::arrayJoinExpressionList() const
{
const ASTArrayJoin * array_join = getFirstArrayJoin(*this);
if (!array_join)
return {};
bool is_left = (array_join->kind == ASTArrayJoin::Kind::Left);
return {array_join->expression_list, is_left};
}
/// Returns the element of the tables list that carries a JOIN, as found by getFirstTableJoin:
/// nullptr when there is none; NOT_IMPLEMENTED is thrown when more than one element has a JOIN.
const ASTTablesInSelectQueryElement * ASTSelectQuery::join() const
{
return getFirstTableJoin(*this);
}
/// True when at least one element of the tables list has `table_join` set.
/// Unlike join(), this never throws on multiple JOINs: it stops at the first match.
bool ASTSelectQuery::hasJoin() const
{
    const auto tables_ast = tables();
    if (!tables_ast)
        return false;

    for (const auto & element_ast : tables_ast->as<ASTTablesInSelectQuery &>().children)
    {
        if (element_ast->as<ASTTablesInSelectQueryElement &>().table_join)
            return true;
    }

    return false;
}
/// Returns the alias of whichever source the table expression holds, checked in this order:
/// subquery, table function, table identifier. An empty string is returned when none is set.
/// `table_expression` must not be null.
static String getTableExpressionAlias(const ASTTableExpression * table_expression)
{
    if (const auto & subquery = table_expression->subquery)
        return subquery->tryGetAlias();

    if (const auto & table_function = table_expression->table_function)
        return table_function->tryGetAlias();

    if (const auto & table_identifier = table_expression->database_and_table_name)
        return table_identifier->tryGetAlias();

    return String();
}
/// Convenience overload: builds a StorageID from the two names and delegates to the StorageID overload.
/// The database name "_temporary_and_external_tables" is rejected via assert.
void ASTSelectQuery::replaceDatabaseAndTable(const String & database_name, const String & table_name)
{
assert(database_name != "_temporary_and_external_tables");
replaceDatabaseAndTable(StorageID(database_name, table_name));
}
void ASTSelectQuery::replaceDatabaseAndTable(const StorageID & table_id)
{
ASTTableExpression * table_expression = getFirstTableExpression(*this);
if (!table_expression)
{
setExpression(Expression::TABLES, std::make_shared<ASTTablesInSelectQuery>());
auto element = std::make_shared<ASTTablesInSelectQueryElement>();
auto table_expr = std::make_shared<ASTTableExpression>();
element->table_expression = table_expr;
element->children.emplace_back(table_expr);
tables()->children.emplace_back(element);
table_expression = table_expr.get();
}
String table_alias = getTableExpressionAlias(table_expression);
table_expression->database_and_table_name = std::make_shared<ASTTableIdentifier>(table_id);
if (!table_alias.empty())
table_expression->database_and_table_name->setAlias(table_alias);
}
/** Makes the first table expression of the query read from a clone of `table_function_ptr`
  * instead of a table identifier.
  *
  * If the query has no first table expression yet, a fresh tables list with a single element is installed.
  * The alias that the table expression had before the replacement (if any) is transferred to the
  * cloned table function, mirroring what replaceDatabaseAndTable does for table identifiers.
  *
  * `table_function_ptr` itself is never modified: only its clone is stored and re-aliased.
  */
void ASTSelectQuery::addTableFunction(ASTPtr & table_function_ptr)
{
    ASTTableExpression * table_expression = getFirstTableExpression(*this);

    if (!table_expression)
    {
        /// Build the chain: tables list -> element -> table expression.
        setExpression(Expression::TABLES, std::make_shared<ASTTablesInSelectQuery>());
        auto element = std::make_shared<ASTTablesInSelectQueryElement>();
        auto table_expr = std::make_shared<ASTTableExpression>();
        element->table_expression = table_expr;
        element->children.emplace_back(table_expr);
        tables()->children.emplace_back(element);
        table_expression = table_expr.get();
    }

    /// Must be read before the table expression is modified below.
    String table_alias = getTableExpressionAlias(table_expression);

    /// Maybe need to modify the alias, so we should clone new table_function node
    table_expression->table_function = table_function_ptr->clone();
    table_expression->database_and_table_name = nullptr;

    /// Keep the alias of the replaced table expression.
    /// (The condition used to be inverted: the alias was "set" only when it was empty,
    /// so an existing alias was silently dropped.)
    if (!table_alias.empty())
        table_expression->table_function->setAlias(table_alias);
}
/// Sets, replaces or removes the child that plays the role `expr`.
///  - non-null `ast`: stored in the slot already registered for `expr`, or appended to `children`
///    with its index recorded in `positions`;
///  - null `ast`: the child registered for `expr` (if any) is erased and the indexes of all
///    children that followed it are shifted down by one.
void ASTSelectQuery::setExpression(Expression expr, ASTPtr && ast)
{
    const auto found = positions.find(expr);
    const bool is_registered = (found != positions.end());

    if (ast)
    {
        if (is_registered)
        {
            children[found->second] = ast;
        }
        else
        {
            positions.emplace(expr, children.size());
            children.emplace_back(ast);
        }
        return;
    }

    /// Nothing to remove.
    if (!is_registered)
        return;

    const size_t removed_index = found->second;
    children.erase(children.begin() + removed_index);
    positions.erase(found);

    /// Close the gap left by the erased child.
    for (auto & entry : positions)
    {
        if (entry.second > removed_index)
            --entry.second;
    }
}
/// Returns a mutable reference to the child registered for `expr`.
/// Throws LOGICAL_ERROR if no child has been set for it.
ASTPtr & ASTSelectQuery::getExpression(Expression expr)
{
    const auto found = positions.find(expr);
    if (found == positions.end())
        throw Exception("Get expression before set", ErrorCodes::LOGICAL_ERROR);

    return children[found->second];
}
/// Sets the `final` flag on the table expression of the first element of the tables list.
/// Throws LOGICAL_ERROR when the query has no tables list, the list is empty,
/// or its first element carries no table expression.
void ASTSelectQuery::setFinal() // NOLINT method can be made const
{
    /// tables() may be null (other functions in this file check for it), so guard before dereferencing.
    const auto tables_list = tables();
    if (!tables_list)
        throw Exception(ErrorCodes::LOGICAL_ERROR, "Tables list is empty, it's a bug");

    auto & tables_in_select_query = tables_list->as<ASTTablesInSelectQuery &>();

    if (tables_in_select_query.children.empty())
        throw Exception(ErrorCodes::LOGICAL_ERROR, "Tables list is empty, it's a bug");

    auto & tables_element = tables_in_select_query.children[0]->as<ASTTablesInSelectQueryElement &>();

    if (!tables_element.table_expression)
        throw Exception(ErrorCodes::LOGICAL_ERROR, "There is no table expression, it's a bug");

    tables_element.table_expression->as<ASTTableExpression &>().final = true;
}
/// True when analyzeReceiveQueryParams reports at least one entry for a clone of this query.
bool ASTSelectQuery::hasQueryParameters() const
{
    const auto received_params = analyzeReceiveQueryParams(this->clone());
    return !received_params.empty();
}
/// Walks a clone of this query breadth-first and collects name -> value pairs.
/// A pair is taken from every expression list that has exactly two children where the first
/// is an identifier and the second is a literal; the literal is converted with convertFieldToString.
/// If the same name occurs more than once, the value visited last wins.
NameToNameMap ASTSelectQuery::getQueryParameterValues() const
{
    NameToNameMap values_by_name;

    std::queue<ASTPtr> pending;
    pending.push(this->clone());

    while (!pending.empty())
    {
        /// Copy the pointer: pop() destroys the queue slot.
        const ASTPtr node = pending.front();
        pending.pop();

        const auto * pair_list = node->as<ASTExpressionList>();
        if (pair_list && pair_list->children.size() == 2)
        {
            const auto * name_node = pair_list->children[0]->as<ASTIdentifier>();
            const auto * value_node = name_node ? pair_list->children[1]->as<ASTLiteral>() : nullptr;

            if (value_node)
                values_by_name[name_node->name()] = convertFieldToString(value_node->value);
        }

        /// Every node's children are visited, whether or not the node itself matched.
        for (const auto & child : node->children)
            pending.push(child);
    }

    return values_by_name;
}
}