2017-07-12 04:17:05 +00:00
|
|
|
#pragma once
|
|
|
|
|
2021-11-29 09:47:21 +00:00
|
|
|
#include <Core/Defines.h>
|
2017-07-12 04:17:05 +00:00
|
|
|
#include <Parsers/Lexer.h>
|
|
|
|
|
2022-10-17 16:39:42 +00:00
|
|
|
#include <cassert>
|
2021-11-29 09:47:21 +00:00
|
|
|
#include <vector>
|
|
|
|
|
2017-07-12 04:17:05 +00:00
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
|
|
|
/** The parser operates on a lazy stream of tokens.
  * It can look ahead to any depth.
  */
|
|
|
|
|
2017-07-12 19:20:57 +00:00
|
|
|
/** Used as an input for parsers.
|
|
|
|
* All whitespace and comment tokens are transparently skipped.
|
|
|
|
*/
|
2017-07-12 04:17:05 +00:00
|
|
|
class Tokens
|
|
|
|
{
|
|
|
|
private:
|
|
|
|
std::vector<Token> data;
|
2022-10-17 10:06:28 +00:00
|
|
|
std::size_t last_accessed_index = 0;
|
2017-07-12 04:17:05 +00:00
|
|
|
|
|
|
|
public:
|
2023-05-25 14:05:44 +00:00
|
|
|
Tokens(const char * begin, const char * end, size_t max_query_size = 0, bool skip_insignificant = true);
|
2017-07-12 04:17:05 +00:00
|
|
|
|
2022-10-17 10:06:28 +00:00
|
|
|
ALWAYS_INLINE inline const Token & operator[](size_t index)
|
2017-07-12 20:45:27 +00:00
|
|
|
{
|
2022-10-17 16:39:42 +00:00
|
|
|
assert(index < data.size());
|
2022-10-17 10:06:28 +00:00
|
|
|
last_accessed_index = std::max(last_accessed_index, index);
|
|
|
|
return data[index];
|
2017-07-12 20:45:27 +00:00
|
|
|
}
|
2022-10-17 10:06:28 +00:00
|
|
|
|
|
|
|
ALWAYS_INLINE inline const Token & max() { return data[last_accessed_index]; }
|
2017-07-12 04:17:05 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
/// To represent position in a token stream.
|
|
|
|
class TokenIterator
|
|
|
|
{
|
|
|
|
private:
|
|
|
|
Tokens * tokens;
|
|
|
|
size_t index = 0;
|
|
|
|
|
|
|
|
public:
|
2019-08-03 11:02:40 +00:00
|
|
|
explicit TokenIterator(Tokens & tokens_) : tokens(&tokens_) {}
|
2017-07-12 04:17:05 +00:00
|
|
|
|
2021-11-29 09:47:21 +00:00
|
|
|
ALWAYS_INLINE const Token & get() { return (*tokens)[index]; }
|
|
|
|
ALWAYS_INLINE const Token & operator*() { return get(); }
|
|
|
|
ALWAYS_INLINE const Token * operator->() { return &get(); }
|
2017-07-12 04:17:05 +00:00
|
|
|
|
2021-11-29 09:47:21 +00:00
|
|
|
ALWAYS_INLINE TokenIterator & operator++()
|
|
|
|
{
|
|
|
|
++index;
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
ALWAYS_INLINE TokenIterator & operator--()
|
|
|
|
{
|
|
|
|
--index;
|
|
|
|
return *this;
|
|
|
|
}
|
2017-07-12 19:20:57 +00:00
|
|
|
|
2021-11-29 09:47:21 +00:00
|
|
|
ALWAYS_INLINE bool operator<(const TokenIterator & rhs) const { return index < rhs.index; }
|
|
|
|
ALWAYS_INLINE bool operator<=(const TokenIterator & rhs) const { return index <= rhs.index; }
|
|
|
|
ALWAYS_INLINE bool operator==(const TokenIterator & rhs) const { return index == rhs.index; }
|
|
|
|
ALWAYS_INLINE bool operator!=(const TokenIterator & rhs) const { return index != rhs.index; }
|
2017-07-12 04:17:05 +00:00
|
|
|
|
2021-11-29 09:47:21 +00:00
|
|
|
ALWAYS_INLINE bool isValid() { return get().type < TokenType::EndOfStream; }
|
2017-07-12 20:45:27 +00:00
|
|
|
|
2017-07-13 01:12:13 +00:00
|
|
|
/// Rightmost token we had looked.
|
2021-11-29 09:47:21 +00:00
|
|
|
ALWAYS_INLINE const Token & max() { return tokens->max(); }
|
2017-07-12 04:17:05 +00:00
|
|
|
};
|
|
|
|
|
2017-07-13 04:20:56 +00:00
|
|
|
|
|
|
|
/// Returns positions of unmatched parentheses.
|
2017-07-13 05:38:02 +00:00
|
|
|
using UnmatchedParentheses = std::vector<Token>;
|
2021-01-31 23:10:41 +00:00
|
|
|
UnmatchedParentheses checkUnmatchedParentheses(TokenIterator begin);
|
2017-07-13 04:20:56 +00:00
|
|
|
|
2017-07-12 04:17:05 +00:00
|
|
|
}
|