2018-11-02 18:53:23 +00:00
|
|
|
#pragma once
|
|
|
|
|
2019-10-19 20:36:35 +00:00
|
|
|
#include <Core/Block.h>
|
2019-09-03 16:56:32 +00:00
|
|
|
#include <Core/NamesAndTypes.h>
|
2019-01-25 11:43:19 +00:00
|
|
|
#include <Interpreters/Aliases.h>
|
2021-04-10 23:33:54 +00:00
|
|
|
#include <Interpreters/Context_fwd.h>
|
2020-03-03 14:25:45 +00:00
|
|
|
#include <Interpreters/DatabaseAndTableWithAlias.h>
|
2021-04-10 23:33:54 +00:00
|
|
|
#include <Interpreters/SelectQueryOptions.h>
|
2019-05-17 14:34:25 +00:00
|
|
|
#include <Storages/IStorage_fwd.h>
|
2018-11-02 18:53:23 +00:00
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2019-08-13 12:39:03 +00:00
|
|
|
class ASTFunction;
|
2020-06-25 20:59:10 +00:00
|
|
|
struct ASTTablesInSelectQueryElement;
|
2020-04-07 09:48:47 +00:00
|
|
|
class TableJoin;
|
2020-02-26 19:33:09 +00:00
|
|
|
struct Settings;
|
2019-09-03 16:56:32 +00:00
|
|
|
struct SelectQueryOptions;
|
2019-10-19 20:36:35 +00:00
|
|
|
/// Map from a String key to a Block; TreeRewriterResult uses it to hold results of scalar subqueries.
using Scalars = std::map<String, Block>;
|
2020-06-17 16:39:58 +00:00
|
|
|
struct StorageInMemoryMetadata;
|
2020-06-18 11:02:31 +00:00
|
|
|
/// Shared pointer to a const StorageInMemoryMetadata.
using StorageMetadataPtr = std::shared_ptr<const StorageInMemoryMetadata>;
|
2019-08-13 12:39:03 +00:00
|
|
|
|
2020-07-22 17:13:05 +00:00
|
|
|
struct TreeRewriterResult
|
2018-11-02 18:53:23 +00:00
|
|
|
{
|
2020-03-24 18:06:55 +00:00
|
|
|
ConstStoragePtr storage;
|
2020-06-17 16:39:58 +00:00
|
|
|
StorageMetadataPtr metadata_snapshot;
|
2020-04-07 09:48:47 +00:00
|
|
|
std::shared_ptr<TableJoin> analyzed_join;
|
2020-06-25 20:59:10 +00:00
|
|
|
const ASTTablesInSelectQueryElement * ast_join = nullptr;
|
2018-11-02 18:53:23 +00:00
|
|
|
|
2018-11-08 17:28:52 +00:00
|
|
|
NamesAndTypesList source_columns;
|
2020-03-03 14:25:45 +00:00
|
|
|
NameSet source_columns_set; /// Set of names of source_columns.
|
2019-08-09 14:50:04 +00:00
|
|
|
/// Set of columns that are enough to read from the table to evaluate the expression. It does not include joined columns.
|
|
|
|
NamesAndTypesList required_source_columns;
|
2021-06-17 15:00:03 +00:00
|
|
|
/// Same as above but also record alias columns which are expanded. This is for RBAC access check.
|
|
|
|
Names required_source_columns_before_expanding_alias_columns;
|
2018-11-08 17:28:52 +00:00
|
|
|
|
2021-06-15 10:28:13 +00:00
|
|
|
/// Set of alias columns that are expanded to their alias expressions. We still need the original columns to check access permission.
|
|
|
|
NameSet expanded_aliases;
|
|
|
|
|
2018-11-02 18:53:23 +00:00
|
|
|
Aliases aliases;
|
2019-08-13 12:39:03 +00:00
|
|
|
std::vector<const ASTFunction *> aggregates;
|
2018-11-02 18:53:23 +00:00
|
|
|
|
2020-12-22 01:37:45 +00:00
|
|
|
std::vector<const ASTFunction *> window_function_asts;
|
2020-12-09 11:14:40 +00:00
|
|
|
|
2018-11-02 18:53:23 +00:00
|
|
|
/// Which column is needed to be ARRAY-JOIN'ed to get the specified.
|
|
|
|
/// For example, for `SELECT s.v ... ARRAY JOIN a AS s` will get "s.v" -> "a.v".
|
|
|
|
NameToNameMap array_join_result_to_source;
|
|
|
|
|
|
|
|
/// For the ARRAY JOIN section, mapping from the alias to the full column name.
|
|
|
|
/// For example, for `ARRAY JOIN [1,2] AS b` "b" -> "array(1,2)" will enter here.
|
2018-11-08 15:43:14 +00:00
|
|
|
/// Note: not used further.
|
2018-11-02 18:53:23 +00:00
|
|
|
NameToNameMap array_join_alias_to_name;
|
|
|
|
|
|
|
|
/// The backward mapping for array_join_alias_to_name.
|
2018-11-08 15:43:14 +00:00
|
|
|
/// Note: not used further.
|
2018-11-02 18:53:23 +00:00
|
|
|
NameToNameMap array_join_name_to_alias;
|
|
|
|
|
|
|
|
/// Predicate optimizer overrides the sub queries
|
|
|
|
bool rewrite_subqueries = false;
|
2019-08-09 14:50:04 +00:00
|
|
|
|
2020-12-18 20:09:39 +00:00
|
|
|
/// Whether the query contains explicit columns like "SELECT column1 + column2 FROM table1".
|
|
|
|
/// Queries like "SELECT count() FROM table1", "SELECT 1" don't contain explicit columns.
|
|
|
|
bool has_explicit_columns = false;
|
|
|
|
|
|
|
|
/// Whether it's possible to use the trivial count optimization,
|
|
|
|
/// i.e. use a fast call of IStorage::totalRows() (or IStorage::totalRowsByPartitionPredicate())
|
|
|
|
/// instead of actual retrieving columns and counting rows.
|
2020-06-04 22:01:40 +00:00
|
|
|
bool optimize_trivial_count = false;
|
|
|
|
|
2020-11-13 15:56:25 +00:00
|
|
|
/// Cache isRemote() call for storage, because it may be too heavy.
|
|
|
|
bool is_remote_storage = false;
|
|
|
|
|
2019-10-19 20:36:35 +00:00
|
|
|
/// Results of scalar sub queries
|
|
|
|
Scalars scalars;
|
|
|
|
|
2020-07-22 17:13:05 +00:00
|
|
|
TreeRewriterResult(
|
2020-06-17 16:39:58 +00:00
|
|
|
const NamesAndTypesList & source_columns_,
|
|
|
|
ConstStoragePtr storage_ = {},
|
|
|
|
const StorageMetadataPtr & metadata_snapshot_ = {},
|
2020-11-13 15:56:25 +00:00
|
|
|
bool add_special = true);
|
2020-03-03 14:25:45 +00:00
|
|
|
|
2020-04-29 16:26:01 +00:00
|
|
|
void collectSourceColumns(bool add_special);
|
2020-06-04 22:01:40 +00:00
|
|
|
void collectUsedColumns(const ASTPtr & query, bool is_select);
|
2019-08-09 14:50:04 +00:00
|
|
|
Names requiredSourceColumns() const { return required_source_columns.getNames(); }
|
2021-06-17 15:00:03 +00:00
|
|
|
const Names & requiredSourceColumnsForAccessCheck() const { return required_source_columns_before_expanding_alias_columns; }
|
2020-12-12 16:42:15 +00:00
|
|
|
NameSet getArrayJoinSourceNameSet() const;
|
2021-06-15 10:28:13 +00:00
|
|
|
Names getExpandedAliases() const { return {expanded_aliases.begin(), expanded_aliases.end()}; }
|
2019-10-19 20:36:35 +00:00
|
|
|
const Scalars & getScalars() const { return scalars; }
|
2018-11-02 18:53:23 +00:00
|
|
|
};
|
|
|
|
|
2020-07-22 17:13:05 +00:00
|
|
|
/// Shared pointer to a const TreeRewriterResult; returned by TreeRewriter::analyze() and TreeRewriter::analyzeSelect().
using TreeRewriterResultPtr = std::shared_ptr<const TreeRewriterResult>;
|
2018-11-08 15:43:14 +00:00
|
|
|
|
2020-07-22 17:13:05 +00:00
|
|
|
/// Tree Rewriter in terms of CMU slides @sa https://15721.courses.cs.cmu.edu/spring2020/slides/19-optimizer1.pdf
|
|
|
|
///
|
|
|
|
/// Optimises the AST and collects information for further expression analysis in ExpressionAnalyzer.
|
2018-11-08 11:17:31 +00:00
|
|
|
/// Result AST has the following invariants:
|
|
|
|
/// * all aliases are substituted
|
|
|
|
/// * qualified names are translated
|
|
|
|
/// * scalar subqueries are executed and replaced with constants
|
|
|
|
/// * unneeded columns are removed from SELECT clause
|
|
|
|
/// * duplicated columns are removed from ORDER BY, LIMIT BY, USING(...).
|
2021-06-01 12:20:52 +00:00
|
|
|
class TreeRewriter : WithContext
|
2018-11-02 18:53:23 +00:00
|
|
|
{
|
|
|
|
public:
|
2021-06-01 12:20:52 +00:00
|
|
|
explicit TreeRewriter(ContextPtr context_) : WithContext(context_) {}
|
2018-11-08 11:17:31 +00:00
|
|
|
|
2020-02-26 19:33:09 +00:00
|
|
|
/// Analyze and rewrite not select query
|
2020-07-22 17:13:05 +00:00
|
|
|
TreeRewriterResultPtr analyze(
|
2020-06-17 16:39:58 +00:00
|
|
|
ASTPtr & query,
|
|
|
|
const NamesAndTypesList & source_columns_,
|
|
|
|
ConstStoragePtr storage = {},
|
|
|
|
const StorageMetadataPtr & metadata_snapshot = {},
|
2021-06-08 09:54:00 +00:00
|
|
|
bool allow_aggregations = false,
|
|
|
|
bool allow_self_aliases = true) const;
|
2020-02-26 19:33:09 +00:00
|
|
|
|
|
|
|
/// Analyze and rewrite select query
|
2020-07-22 17:13:05 +00:00
|
|
|
TreeRewriterResultPtr analyzeSelect(
|
2018-11-08 15:43:14 +00:00
|
|
|
ASTPtr & query,
|
2020-07-22 17:13:05 +00:00
|
|
|
TreeRewriterResult && result,
|
2020-02-26 19:33:09 +00:00
|
|
|
const SelectQueryOptions & select_options = {},
|
2020-03-03 14:25:45 +00:00
|
|
|
const std::vector<TableWithColumnNamesAndTypes> & tables_with_columns = {},
|
2020-04-08 18:59:52 +00:00
|
|
|
const Names & required_result_columns = {},
|
|
|
|
std::shared_ptr<TableJoin> table_join = {}) const;
|
2018-11-08 11:17:31 +00:00
|
|
|
|
2019-01-09 16:16:59 +00:00
|
|
|
private:
|
2021-06-07 20:59:38 +00:00
|
|
|
static void normalize(ASTPtr & query, Aliases & aliases, const NameSet & source_columns_set, bool ignore_alias, const Settings & settings, bool allow_self_aliases);
|
2018-11-02 18:53:23 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
}
|