2014-03-10 12:25:37 +00:00
|
|
|
#pragma once
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2017-07-13 04:20:56 +00:00
|
|
|
#include <set>
|
2014-03-10 14:47:04 +00:00
|
|
|
#include <memory>
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Core/Defines.h>
|
|
|
|
#include <Core/Types.h>
|
2020-01-14 11:11:01 +00:00
|
|
|
#include <Core/Settings.h>
|
|
|
|
#include <IO/WriteHelpers.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Parsers/IAST.h>
|
2017-07-10 03:28:12 +00:00
|
|
|
#include <Parsers/TokenIterator.h>
|
2010-06-24 19:12:10 +00:00
|
|
|
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2019-08-10 16:38:25 +00:00
|
|
|
/// Error codes thrown by the parser interface in this header.
/// They are only declared here (extern, no initializer); the definitions are provided elsewhere.
namespace ErrorCodes
{
    extern const int TOO_DEEP_RECURSION;  /// Thrown by IParser::Pos::increaseDepth().
    extern const int LOGICAL_ERROR;       /// Thrown by IParser::Pos::decreaseDepth().
}
|
|
|
|
|
|
|
|
|
2017-07-13 04:20:56 +00:00
|
|
|
/** Collects variants, how parser could proceed further at rightmost position.
|
|
|
|
*/
|
|
|
|
struct Expected
|
|
|
|
{
|
|
|
|
const char * max_parsed_pos = nullptr;
|
|
|
|
std::set<const char *> variants;
|
|
|
|
|
|
|
|
/// 'description' should be statically allocated string.
|
|
|
|
void add(const char * current_pos, const char * description)
|
|
|
|
{
|
|
|
|
if (!max_parsed_pos || current_pos > max_parsed_pos)
|
|
|
|
{
|
|
|
|
variants.clear();
|
|
|
|
max_parsed_pos = current_pos;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!max_parsed_pos || current_pos >= max_parsed_pos)
|
|
|
|
variants.insert(description);
|
|
|
|
}
|
|
|
|
|
|
|
|
void add(TokenIterator it, const char * description)
|
|
|
|
{
|
|
|
|
add(it->begin, description);
|
|
|
|
}
|
|
|
|
};
|
2014-06-12 00:48:56 +00:00
|
|
|
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2017-05-27 17:29:55 +00:00
|
|
|
/** Interface for parser classes
|
2010-06-24 19:12:10 +00:00
|
|
|
*/
|
|
|
|
class IParser
|
|
|
|
{
|
|
|
|
public:
|
2019-08-10 16:38:25 +00:00
|
|
|
/// Token iterator augmented with depth information. This allows to control recursion depth.
|
|
|
|
struct Pos : TokenIterator
|
|
|
|
{
|
|
|
|
using TokenIterator::TokenIterator;
|
|
|
|
|
|
|
|
uint32_t depth = 0;
|
2020-01-14 11:11:01 +00:00
|
|
|
uint32_t max_depth = 0;
|
|
|
|
|
|
|
|
Pos(Tokens & tokens_, uint32_t max_depth_) : TokenIterator(tokens_), max_depth(max_depth_) {}
|
2019-08-10 16:38:25 +00:00
|
|
|
|
|
|
|
void increaseDepth()
|
|
|
|
{
|
|
|
|
++depth;
|
2020-01-14 11:11:01 +00:00
|
|
|
if (max_depth > 0 && depth > max_depth)
|
|
|
|
throw Exception("Maximum parse depth (" + toString(max_depth) + ") exceeded. Consider rising max_parser_depth parameter.", ErrorCodes::TOO_DEEP_RECURSION);
|
2019-08-10 16:38:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void decreaseDepth()
|
|
|
|
{
|
|
|
|
if (depth == 0)
|
|
|
|
throw Exception("Logical error in parser: incorrect calculation of parse depth", ErrorCodes::LOGICAL_ERROR);
|
|
|
|
--depth;
|
|
|
|
}
|
|
|
|
};
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2017-05-27 17:29:55 +00:00
|
|
|
/** Get the text of this parser parses. */
|
2017-04-01 07:20:54 +00:00
|
|
|
virtual const char * getName() const = 0;
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2017-05-27 17:29:55 +00:00
|
|
|
/** Parse piece of text from position `pos`, but not beyond end of line (`end` - position after end of line),
|
|
|
|
* move pointer `pos` to the maximum position to which it was possible to parse,
|
|
|
|
* in case of success return `true` and the result in `node` if it is needed, otherwise false,
|
|
|
|
* in `expected` write what was expected in the maximum position,
|
|
|
|
* to which it was possible to parse if parsing was unsuccessful,
|
|
|
|
* or what this parser parse if parsing was successful.
|
|
|
|
* The string to which the [begin, end) range is included may be not 0-terminated.
|
2017-04-01 07:20:54 +00:00
|
|
|
*/
|
2017-07-10 03:28:12 +00:00
|
|
|
virtual bool parse(Pos & pos, ASTPtr & node, Expected & expected) = 0;
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2017-07-10 03:28:12 +00:00
|
|
|
bool ignore(Pos & pos, Expected & expected)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
|
|
|
ASTPtr ignore_node;
|
2017-07-10 03:28:12 +00:00
|
|
|
return parse(pos, ignore_node, expected);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
2015-02-01 07:27:56 +00:00
|
|
|
|
2017-07-10 03:28:12 +00:00
|
|
|
bool ignore(Pos & pos)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
|
|
|
Expected expected;
|
2017-07-10 03:28:12 +00:00
|
|
|
return ignore(pos, expected);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2017-05-27 17:29:55 +00:00
|
|
|
/** The same, but do not move the position and do not write the result to node.
|
2017-04-01 07:20:54 +00:00
|
|
|
*/
|
2017-07-10 03:28:12 +00:00
|
|
|
bool check(Pos & pos, Expected & expected)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
|
|
|
Pos begin = pos;
|
|
|
|
ASTPtr node;
|
2017-07-10 03:28:12 +00:00
|
|
|
if (!parse(pos, node, expected))
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
|
|
|
pos = begin;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
return true;
|
|
|
|
}
|
2010-06-24 19:12:10 +00:00
|
|
|
|
2019-10-08 13:26:15 +00:00
|
|
|
/** The same, but doesn't move the position even if parsing was successful.
|
2018-11-14 22:46:39 +00:00
|
|
|
*/
|
2019-10-08 13:26:15 +00:00
|
|
|
bool checkWithoutMoving(Pos pos, Expected & expected)
|
2018-11-14 22:46:39 +00:00
|
|
|
{
|
|
|
|
ASTPtr node;
|
|
|
|
return parse(pos, node, expected);
|
|
|
|
}
|
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
virtual ~IParser() {}
|
2010-06-24 19:12:10 +00:00
|
|
|
};
|
|
|
|
|
2015-04-11 03:10:23 +00:00
|
|
|
/// Owning pointer to a parser, held through the IParser interface.
using ParserPtr = std::unique_ptr<IParser>;
|
2014-04-13 08:52:50 +00:00
|
|
|
|
2010-06-24 19:12:10 +00:00
|
|
|
}
|