#include #include #include #include #include #include #include #include #include #include #include #include namespace DB { namespace ErrorCodes { extern const int SYNTAX_ERROR; } bool ParserSelectQuery::parseImpl(Pos & pos, Pos end, ASTPtr & node, Pos & max_parsed_pos, Expected & expected) { Pos begin = pos; auto select_query = std::make_shared(); node = select_query; ParserString s_select("SELECT", true, true); ParserString s_distinct("DISTINCT", true, true); ParserString s_from("FROM", true, true); ParserString s_left("LEFT", true, true); ParserString s_array("ARRAY", true, true); ParserString s_join("JOIN", true, true); ParserString s_using("USING", true, true); ParserString s_prewhere("PREWHERE", true, true); ParserString s_where("WHERE", true, true); ParserString s_final("FINAL", true, true); ParserString s_sample("SAMPLE", true, true); ParserString s_offset("OFFSET", true, true); ParserString s_group("GROUP", true, true); ParserString s_by("BY", true, true); ParserString s_with("WITH", true, true); ParserString s_totals("TOTALS", true, true); ParserString s_having("HAVING", true, true); ParserString s_order("ORDER", true, true); ParserString s_limit("LIMIT", true, true); ParserString s_settings("SETTINGS", true, true); ParserString s_union("UNION", true, true); ParserString s_all("ALL", true, true); ParserNotEmptyExpressionList exp_list(false); ParserNotEmptyExpressionList exp_list_for_select_clause(true); /// Разрешает алиасы без слова AS. ParserExpressionWithOptionalAlias exp_elem(false); ParserJoin join; ParserOrderByExpressionList order_list; ws.ignore(pos, end); /// SELECT [DISTINCT] expr list { if (!s_select.ignore(pos, end, max_parsed_pos, expected)) return false; ws.ignore(pos, end); if (s_distinct.ignore(pos, end, max_parsed_pos, expected)) { select_query->distinct = true; ws.ignore(pos, end); } if (!exp_list_for_select_clause.parse(pos, end, select_query->select_expression_list, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// FROM database.table или FROM table или FROM (subquery) или FROM tableFunction if (s_from.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); ParserWithOptionalAlias table_p(std::make_unique(), true); if (!table_p.parse(pos, end, select_query->table, max_parsed_pos, expected)) return false; /// Раскрываем составной идентификатор в имя БД и имя таблицы. NOTE Можно избавиться от этого в будущем. if (const ASTIdentifier * table_identifier = typeid_cast(select_query->table.get())) { if (table_identifier->children.size() > 2) throw Exception("Too many components to table. Table may be specified either in database.table or in table form", ErrorCodes::SYNTAX_ERROR); if (table_identifier->children.size() == 2) { select_query->database = table_identifier->children.at(0); typeid_cast(*select_query->database).kind = ASTIdentifier::Database; select_query->table = table_identifier->children.at(1); typeid_cast(*select_query->table).kind = ASTIdentifier::Table; } } ws.ignore(pos, end); } /** FINAL и SAMPLE может быть здесь или после всех JOIN-ов * (второй вариант был изначально сделан по ошибке, и его приходится поддерживать). */ auto parse_final_and_sample = [&]() -> bool { /// FINAL if (!select_query->final && s_final.ignore(pos, end, max_parsed_pos, expected)) { select_query->final = true; ws.ignore(pos, end); } /// SAMPLE number if (!select_query->sample_size && s_sample.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); ParserSampleRatio ratio; if (!ratio.parse(pos, end, select_query->sample_size, max_parsed_pos, expected)) return false; ws.ignore(pos, end); /// OFFSET number if (s_offset.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (!ratio.parse(pos, end, select_query->sample_offset, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } } return true; }; if (!parse_final_and_sample()) return false; /// [LEFT] ARRAY JOIN expr list Pos saved_pos = pos; bool has_array_join = false; if (s_left.ignore(pos, end, max_parsed_pos, expected) && ws.ignore(pos, end) && s_array.ignore(pos, end, max_parsed_pos, expected)) { select_query->array_join_is_left = true; has_array_join = true; } else { pos = saved_pos; if (s_array.ignore(pos, end, max_parsed_pos, expected)) has_array_join = true; } if (has_array_join) { ws.ignore(pos, end); if (!s_join.ignore(pos, end, max_parsed_pos, expected)) return false; ws.ignore(pos, end); if (!exp_list.parse(pos, end, select_query->array_join_expression_list, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// [GLOBAL] [ANY|ALL] INNER|LEFT|RIGHT|FULL|CROSS [OUTER] JOIN (subquery)|table_name USING tuple join.parse(pos, end, select_query->join, max_parsed_pos, expected); if (!parse_final_and_sample()) return false; /// PREWHERE expr if (s_prewhere.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (!exp_elem.parse(pos, end, select_query->prewhere_expression, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// WHERE expr if (s_where.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (!exp_elem.parse(pos, end, select_query->where_expression, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// GROUP BY expr list if (s_group.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (!s_by.ignore(pos, end, max_parsed_pos, expected)) return false; if (!exp_list.parse(pos, end, select_query->group_expression_list, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// WITH TOTALS if (s_with.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (!s_totals.ignore(pos, end, max_parsed_pos, expected)) return false; select_query->group_by_with_totals = true; ws.ignore(pos, end); } /// HAVING expr if (s_having.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (!exp_elem.parse(pos, end, select_query->having_expression, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// ORDER BY expr ASC|DESC COLLATE 'locale' list if (s_order.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (!s_by.ignore(pos, end, max_parsed_pos, expected)) return false; if (!order_list.parse(pos, end, select_query->order_expression_list, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// LIMIT length или LIMIT offset, length if (s_limit.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); ParserString s_comma(","); ParserNumber num; if (!num.parse(pos, end, select_query->limit_length, max_parsed_pos, expected)) return false; ws.ignore(pos, end); if (s_comma.ignore(pos, end, max_parsed_pos, expected)) { select_query->limit_offset = select_query->limit_length; if (!num.parse(pos, end, select_query->limit_length, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } } /// SETTINGS key1 = value1, key2 = value2, ... if (s_settings.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); ParserSetQuery parser_settings(true); if (!parser_settings.parse(pos, end, select_query->settings, max_parsed_pos, expected)) return false; ws.ignore(pos, end); } /// FORMAT format_name if (!parseFormat(*select_query, pos, end, node, max_parsed_pos, expected)) return false; // UNION ALL select query if (s_union.ignore(pos, end, max_parsed_pos, expected)) { ws.ignore(pos, end); if (s_all.ignore(pos, end, max_parsed_pos, expected)) { if (select_query->format) { /// FORMAT может быть задан только в последнем запросе цепочки UNION ALL. expected = "FORMAT only in the last SELECT of the UNION ALL chain"; return false; } ParserSelectQuery select_p; if (!select_p.parse(pos, end, select_query->next_union_all, max_parsed_pos, expected)) return false; auto next_select_query = static_cast(&*select_query->next_union_all); next_select_query->prev_union_all = node.get(); } else return false; ws.ignore(pos, end); } select_query->range = StringRange(begin, pos); select_query->children.push_back(select_query->select_expression_list); if (select_query->database) select_query->children.push_back(select_query->database); if (select_query->table) select_query->children.push_back(select_query->table); if (select_query->array_join_expression_list) select_query->children.push_back(select_query->array_join_expression_list); if (select_query->join) select_query->children.push_back(select_query->join); if (select_query->sample_size) select_query->children.push_back(select_query->sample_size); if (select_query->sample_offset) select_query->children.push_back(select_query->sample_offset); if (select_query->prewhere_expression) select_query->children.push_back(select_query->prewhere_expression); if (select_query->where_expression) select_query->children.push_back(select_query->where_expression); if (select_query->group_expression_list) select_query->children.push_back(select_query->group_expression_list); if (select_query->having_expression) select_query->children.push_back(select_query->having_expression); if (select_query->order_expression_list) select_query->children.push_back(select_query->order_expression_list); if (select_query->limit_offset) select_query->children.push_back(select_query->limit_offset); if (select_query->limit_length) select_query->children.push_back(select_query->limit_length); if (select_query->settings) select_query->children.push_back(select_query->settings); if (select_query->format) select_query->children.push_back(select_query->format); if (select_query->next_union_all) select_query->children.push_back(select_query->next_union_all); return true; } }