ClickHouse/src/Parsers/TokenIterator.h

96 lines
2.3 KiB
C++
Raw Normal View History

#pragma once
2021-11-29 09:47:21 +00:00
#include <Core/Defines.h>
#include <Parsers/Lexer.h>
2021-11-29 09:47:21 +00:00
#include <vector>
namespace DB
{
/** The parser operates on a lazy stream of tokens.
  * It can look ahead to any depth.
  */
/** Used as an input for parsers.
* All whitespace and comment tokens are transparently skipped.
*/
class Tokens
{
private:
std::vector<Token> data;
Lexer lexer;
public:
2018-03-26 19:41:55 +00:00
Tokens(const char * begin, const char * end, size_t max_query_size = 0) : lexer(begin, end, max_query_size) {}
const Token & operator[] (size_t index)
{
while (true)
{
if (index < data.size())
return data[index];
if (!data.empty() && data.back().isEnd())
return data.back();
Token token = lexer.nextToken();
if (token.isSignificant())
data.emplace_back(token);
}
}
const Token & max()
{
if (data.empty())
return (*this)[0];
return data.back();
}
};
/// To represent position in a token stream.
class TokenIterator
{
private:
Tokens * tokens;
size_t index = 0;
public:
2019-08-03 11:02:40 +00:00
explicit TokenIterator(Tokens & tokens_) : tokens(&tokens_) {}
2021-11-29 09:47:21 +00:00
ALWAYS_INLINE const Token & get() { return (*tokens)[index]; }
ALWAYS_INLINE const Token & operator*() { return get(); }
ALWAYS_INLINE const Token * operator->() { return &get(); }
2021-11-29 09:47:21 +00:00
ALWAYS_INLINE TokenIterator & operator++()
{
++index;
return *this;
}
ALWAYS_INLINE TokenIterator & operator--()
{
--index;
return *this;
}
2021-11-29 09:47:21 +00:00
ALWAYS_INLINE bool operator<(const TokenIterator & rhs) const { return index < rhs.index; }
ALWAYS_INLINE bool operator<=(const TokenIterator & rhs) const { return index <= rhs.index; }
ALWAYS_INLINE bool operator==(const TokenIterator & rhs) const { return index == rhs.index; }
ALWAYS_INLINE bool operator!=(const TokenIterator & rhs) const { return index != rhs.index; }
2021-11-29 09:47:21 +00:00
ALWAYS_INLINE bool isValid() { return get().type < TokenType::EndOfStream; }
/// Rightmost token we had looked.
2021-11-29 09:47:21 +00:00
ALWAYS_INLINE const Token & max() { return tokens->max(); }
};
/// Result type of checkUnmatchedParentheses: a list of tokens that, per the original note,
/// gives the positions of unmatched parentheses.
using UnmatchedParentheses = std::vector<Token>;
2021-01-31 23:10:41 +00:00
/// Declaration only; the definition is not in this header.
/// Takes a token iterator by value and returns the unmatched parentheses as tokens.
/// NOTE(review): presumably scans from `begin` to the end of the stream — confirm against the definition.
UnmatchedParentheses checkUnmatchedParentheses(TokenIterator begin);
}