ClickHouse/src/Parsers/ExpressionElementParsers.h

482 lines
16 KiB
C++
Raw Normal View History

2011-09-04 05:14:52 +00:00
#pragma once
2010-06-24 19:12:10 +00:00
2020-03-19 01:15:01 +00:00
#include <Core/Field.h>
2020-12-15 11:35:11 +00:00
#include <Core/MultiEnum.h>
#include <Parsers/IParserBase.h>
2010-06-24 19:12:10 +00:00
namespace DB
{
class ParserArray : public IParserBase
{
protected:
const char * getName() const override { return "array"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2017-05-27 17:29:55 +00:00
/** If in parenthesis an expression from one element - returns this element in `node`;
* or if there is a SELECT subquery in parenthesis, then this subquery returned in `node`;
* otherwise returns `tuple` function from the contents of brackets.
2010-06-24 19:12:10 +00:00
*/
class ParserParenthesisExpression : public IParserBase
{
protected:
const char * getName() const override { return "parenthesized expression"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2017-05-27 17:29:55 +00:00
/** The SELECT subquery is in parenthesis.
2012-08-22 18:46:09 +00:00
*/
class ParserSubquery : public IParserBase
{
protected:
const char * getName() const override { return "SELECT subquery"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2012-08-22 18:46:09 +00:00
};
2017-05-27 17:29:55 +00:00
/** An identifier, for example, x_yz123 or `something special`
2020-11-02 13:15:40 +00:00
* If allow_query_parameter_ = true, also parses substitutions in form {name:Identifier}
2010-06-24 19:12:10 +00:00
*/
class ParserIdentifier : public IParserBase
{
2020-11-02 10:03:52 +00:00
public:
explicit ParserIdentifier(bool allow_query_parameter_ = false) : allow_query_parameter(allow_query_parameter_) {}
2010-06-24 19:12:10 +00:00
protected:
const char * getName() const override { return "identifier"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2020-11-02 10:03:52 +00:00
bool allow_query_parameter;
2010-06-24 19:12:10 +00:00
};
2020-04-06 23:22:44 +00:00
/** An identifier, possibly containing a dot, for example, x_yz123 or `something special` or Hits.EventTime,
* possibly with UUID clause like `db name`.`table name` UUID 'xxxxxxxx-xxxx-xxxx-xxxx-xxxxxxxxxxxx'
*/
class ParserCompoundIdentifier : public IParserBase
{
2020-04-06 23:22:44 +00:00
public:
explicit ParserCompoundIdentifier(bool table_name_with_optional_uuid_ = false, bool allow_query_parameter_ = false)
2020-11-02 10:03:52 +00:00
: table_name_with_optional_uuid(table_name_with_optional_uuid_), allow_query_parameter(allow_query_parameter_)
2020-10-26 15:49:00 +00:00
{
}
protected:
const char * getName() const override { return "compound identifier"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2020-04-07 14:05:51 +00:00
bool table_name_with_optional_uuid;
2020-11-02 10:03:52 +00:00
bool allow_query_parameter;
};
/** *, t.*, db.table.*, COLUMNS('<regular expression>') APPLY(...) or EXCEPT(...) or REPLACE(...)
*/
class ParserColumnsTransformers : public IParserBase
{
public:
enum class ColumnTransformer : UInt8
{
APPLY,
EXCEPT,
REPLACE,
};
using ColumnTransformers = MultiEnum<ColumnTransformer, UInt8>;
static constexpr auto AllTransformers = ColumnTransformers{ColumnTransformer::APPLY, ColumnTransformer::EXCEPT, ColumnTransformer::REPLACE};
explicit ParserColumnsTransformers(ColumnTransformers allowed_transformers_ = AllTransformers, bool is_strict_ = false)
: allowed_transformers(allowed_transformers_)
, is_strict(is_strict_)
{}
protected:
const char * getName() const override { return "COLUMNS transformers"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
ColumnTransformers allowed_transformers;
bool is_strict;
};
/// Just *
class ParserAsterisk : public IParserBase
{
public:
using ColumnTransformers = ParserColumnsTransformers::ColumnTransformers;
explicit ParserAsterisk(ColumnTransformers allowed_transformers_ = ParserColumnsTransformers::AllTransformers)
: allowed_transformers(allowed_transformers_)
{}
protected:
const char * getName() const override { return "asterisk"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
ColumnTransformers allowed_transformers;
};
/** Something like t.* or db.table.*
*/
class ParserQualifiedAsterisk : public IParserBase
{
protected:
const char * getName() const override { return "qualified asterisk"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2019-07-16 20:05:00 +00:00
/** COLUMNS('<regular expression>')
2019-07-12 11:17:38 +00:00
*/
2019-07-21 17:03:58 +00:00
class ParserColumnsMatcher : public IParserBase
2019-07-12 11:17:38 +00:00
{
public:
using ColumnTransformers = ParserColumnsTransformers::ColumnTransformers;
explicit ParserColumnsMatcher(ColumnTransformers allowed_transformers_ = ParserColumnsTransformers::AllTransformers)
: allowed_transformers(allowed_transformers_)
{}
2019-07-12 11:17:38 +00:00
protected:
const char * getName() const override { return "COLUMNS matcher"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
ColumnTransformers allowed_transformers;
2020-08-29 05:33:46 +00:00
};
2017-05-27 17:29:55 +00:00
/** A function, for example, f(x, y + 1, g(z)).
* Or an aggregate function: sum(x + f(y)), corr(x, y). The syntax is the same as the usual function.
* Or a parametric aggregate function: quantile(0.9)(x + y).
* Syntax - two pairs of parentheses instead of one. The first is for parameters, the second for arguments.
* For functions, the DISTINCT modifier can be specified, for example, count(DISTINCT x, y).
2010-06-24 19:12:10 +00:00
*/
class ParserFunction : public IParserBase
{
public:
explicit ParserFunction(bool allow_function_parameters_ = true, bool is_table_function_ = false)
: allow_function_parameters(allow_function_parameters_), is_table_function(is_table_function_)
{
}
2020-10-26 15:49:00 +00:00
2010-06-24 19:12:10 +00:00
protected:
const char * getName() const override { return "function"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
bool allow_function_parameters;
bool is_table_function;
};
// A special function parser for view table function.
// It parses an SELECT query as its argument and doesn't support getColumnName().
class ParserTableFunctionView : public IParserBase
{
protected:
const char * getName() const override { return "function"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2021-07-25 18:43:00 +00:00
// Allows to make queries like SELECT SUM(<expr>) FILTER(WHERE <cond>) FROM ...
class ParserFilterClause : public IParserBase
{
const char * getName() const override { return "filter"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2021-01-12 18:34:35 +00:00
// Window reference (the thing that goes after OVER) for window function.
// Can be either window name or window definition.
class ParserWindowReference : public IParserBase
{
const char * getName() const override { return "window reference"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2020-12-18 17:13:28 +00:00
class ParserWindowDefinition : public IParserBase
2020-12-16 21:44:05 +00:00
{
const char * getName() const override { return "window definition"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2021-01-12 18:34:35 +00:00
// The WINDOW clause of a SELECT query that defines a list of named windows.
// Returns an ASTExpressionList of ASTWindowListElement's.
class ParserWindowList : public IParserBase
{
const char * getName() const override { return "WINDOW clause"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2018-12-13 15:26:28 +00:00
class ParserCodecDeclarationList : public IParserBase
{
protected:
const char * getName() const override { return "codec declaration list"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2018-12-13 15:26:28 +00:00
};
/** Parse compression codec
* CODEC(ZSTD(2))
*/
class ParserCodec : public IParserBase
{
protected:
const char * getName() const override { return "codec"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2018-12-13 15:26:28 +00:00
};
2021-05-04 03:43:17 +00:00
/// Fast path of cast operator "::".
/// It tries to read literal as text.
/// If it fails, later operator will be transformed to function CAST.
/// Examples: "0.1::Decimal(38, 38)", "[1, 2]::Array(UInt8)"
class ParserCastOperator : public IParserBase
{
protected:
2021-05-04 03:43:17 +00:00
const char * getName() const override { return "CAST operator"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2017-01-23 15:55:56 +00:00
/** NULL literal.
2010-06-24 19:12:10 +00:00
*/
class ParserNull : public IParserBase
{
protected:
const char * getName() const override { return "NULL"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2021-11-06 07:19:12 +00:00
/** Bool literal.
*/
class ParserBool : public IParserBase
{
protected:
const char * getName() const override { return "Bool"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2010-06-24 19:12:10 +00:00
2017-01-23 15:55:56 +00:00
/** Numeric literal.
2010-06-24 19:12:10 +00:00
*/
class ParserNumber : public IParserBase
{
protected:
const char * getName() const override { return "number"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2017-01-23 15:55:56 +00:00
/** Unsigned integer, used in right hand side of tuple access operator (x.1).
*/
class ParserUnsignedInteger : public IParserBase
{
protected:
const char * getName() const override { return "unsigned integer"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2010-06-24 19:12:10 +00:00
2017-01-23 15:55:56 +00:00
/** String in single quotes.
2021-07-21 08:59:05 +00:00
* String in heredoc $here$txt$here$ equivalent to 'txt'.
2010-06-24 19:12:10 +00:00
*/
class ParserStringLiteral : public IParserBase
{
protected:
const char * getName() const override { return "string literal"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2020-03-19 01:15:01 +00:00
/** An array or tuple of literals.
* Arrays can also be parsed as an application of [] operator and tuples as an application of 'tuple' function.
* But parsing the whole array/tuple as a whole constant seriously speeds up the analysis of expressions in the case of very large collection.
* We try to parse the array or tuple as a collection of literals first (fast path),
* and if it did not work out (when the collection consists of complex expressions) -
* parse as an application of [] operator or 'tuple' function (slow path).
*/
2020-03-19 01:15:01 +00:00
template <typename Collection>
class ParserCollectionOfLiterals : public IParserBase
{
public:
ParserCollectionOfLiterals(TokenType opening_bracket_, TokenType closing_bracket_)
: opening_bracket(opening_bracket_), closing_bracket(closing_bracket_) {}
protected:
const char * getName() const override { return "collection of literals"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
private:
TokenType opening_bracket;
TokenType closing_bracket;
};
2020-03-24 12:55:35 +00:00
/// A tuple of literals with same type.
2020-03-19 01:15:01 +00:00
class ParserTupleOfLiterals : public IParserBase
{
public:
ParserCollectionOfLiterals<Tuple> tuple_parser{TokenType::OpeningRoundBracket, TokenType::ClosingRoundBracket};
protected:
const char * getName() const override { return "tuple"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override
{
return tuple_parser.parse(pos, node, expected);
}
};
class ParserArrayOfLiterals : public IParserBase
{
2020-03-19 01:15:01 +00:00
public:
ParserCollectionOfLiterals<Array> array_parser{TokenType::OpeningSquareBracket, TokenType::ClosingSquareBracket};
protected:
const char * getName() const override { return "array"; }
2020-03-19 01:15:01 +00:00
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override
{
return array_parser.parse(pos, node, expected);
}
2010-06-24 19:12:10 +00:00
};
2017-05-27 17:29:55 +00:00
/** The literal is one of: NULL, UInt64, Int64, Float64, String.
2010-06-24 19:12:10 +00:00
*/
class ParserLiteral : public IParserBase
{
protected:
const char * getName() const override { return "literal"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2017-05-27 17:29:55 +00:00
/** The alias is the identifier before which `AS` comes. For example: AS x_yz123.
2011-11-06 04:21:09 +00:00
*/
class ParserAlias : public IParserBase
2011-11-06 04:21:09 +00:00
{
public:
2020-10-26 15:49:00 +00:00
explicit ParserAlias(bool allow_alias_without_as_keyword_) : allow_alias_without_as_keyword(allow_alias_without_as_keyword_) { }
private:
static const char * restricted_keywords[];
bool allow_alias_without_as_keyword;
const char * getName() const override { return "alias"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2011-11-06 04:21:09 +00:00
};
2020-11-02 10:03:52 +00:00
/** Prepared statements.
* Parse query with parameter expression {name:type}.
*/
class ParserIdentifierOrSubstitution : public IParserBase
{
protected:
2020-11-02 13:15:40 +00:00
const char * getName() const override { return "identifier or substitution"; }
2020-11-02 10:03:52 +00:00
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2019-05-25 13:43:52 +00:00
/** Prepared statements.
2019-05-18 21:07:23 +00:00
* Parse query with parameter expression {name:type}.
*/
2019-05-25 13:43:52 +00:00
class ParserSubstitution : public IParserBase
2019-05-18 21:07:23 +00:00
{
protected:
const char * getName() const override { return "substitution"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2019-05-18 21:07:23 +00:00
};
/** MySQL-style global variable: @@var
*/
class ParserMySQLGlobalVariable : public IParserBase
{
protected:
const char * getName() const override { return "MySQL-style global variable"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2017-05-27 17:29:55 +00:00
/** The expression element is one of: an expression in parentheses, an array, a literal, a function, an identifier, an asterisk.
2010-06-24 19:12:10 +00:00
*/
class ParserExpressionElement : public IParserBase
{
protected:
const char * getName() const override { return "element of expression"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2010-06-24 19:12:10 +00:00
};
2017-05-27 17:29:55 +00:00
/** An expression element, possibly with an alias, if appropriate.
2011-11-06 04:21:09 +00:00
*/
class ParserWithOptionalAlias : public IParserBase
2011-11-06 04:21:09 +00:00
{
2011-11-06 20:47:07 +00:00
public:
ParserWithOptionalAlias(ParserPtr && elem_parser_, bool allow_alias_without_as_keyword_)
2019-10-31 15:22:48 +00:00
: elem_parser(std::move(elem_parser_)), allow_alias_without_as_keyword(allow_alias_without_as_keyword_) {}
2011-11-06 04:21:09 +00:00
protected:
ParserPtr elem_parser;
bool allow_alias_without_as_keyword;
const char * getName() const override { return "element of expression with optional alias"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2011-11-06 04:21:09 +00:00
};
/** Element of ORDER BY expression - same as expression element, but in addition, ASC[ENDING] | DESC[ENDING] could be specified
* and optionally, NULLS LAST|FIRST
* and optionally, COLLATE 'locale'.
* and optionally, WITH FILL [FROM x] [TO y] [STEP z]
2011-09-04 05:14:52 +00:00
*/
class ParserOrderByElement : public IParserBase
{
protected:
const char * getName() const override { return "element of ORDER BY expression"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2011-09-04 05:14:52 +00:00
};
2010-06-24 19:12:10 +00:00
/** Element of INTERPOLATE expression
*/
class ParserInterpolateElement : public IParserBase
{
protected:
const char * getName() const override { return "element of INTERPOLATE expression"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2019-10-07 16:23:16 +00:00
/** Parser for function with arguments like KEY VALUE (space separated)
2020-08-08 00:47:03 +00:00
* no commas allowed, just space-separated pairs.
2019-10-07 16:23:16 +00:00
*/
class ParserFunctionWithKeyValueArguments : public IParserBase
{
public:
2020-10-26 15:49:00 +00:00
explicit ParserFunctionWithKeyValueArguments(bool brackets_can_be_omitted_ = false) : brackets_can_be_omitted(brackets_can_be_omitted_)
{
}
2019-10-07 16:23:16 +00:00
protected:
2019-10-07 16:23:16 +00:00
const char * getName() const override { return "function with key-value arguments"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
/// brackets for function arguments can be omitted
bool brackets_can_be_omitted;
2019-10-07 16:23:16 +00:00
};
2020-06-18 12:52:05 +00:00
/** Table engine, possibly with parameters. See examples from ParserIdentifierWithParameters
2019-10-07 16:23:16 +00:00
* Parse result is ASTFunction, with or without arguments.
*/
class ParserIdentifierWithOptionalParameters : public IParserBase
{
protected:
const char * getName() const override{ return "identifier with optional parameters"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2019-10-07 16:23:16 +00:00
};
2019-10-09 13:02:05 +00:00
/** Element of TTL expression - same as expression element, but in addition,
* TO DISK 'xxx' | TO VOLUME 'xxx' | DELETE could be specified
*/
class ParserTTLElement : public IParserBase
{
protected:
const char * getName() const override { return "element of TTL expression"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
2019-10-09 13:02:05 +00:00
};
2021-01-12 00:40:07 +00:00
/// Part of the UPDATE command or TTL with GROUP BY of the form: col_name = expr
class ParserAssignment : public IParserBase
{
protected:
const char * getName() const override{ return "column assignment"; }
bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
};
2022-01-05 02:30:01 +00:00
ASTPtr createFunctionCast(const ASTPtr & expr_ast, const ASTPtr & type_ast);
2011-09-04 05:14:52 +00:00
}