ClickHouse/src/Storages/ConstraintsDescription.cpp

220 lines
7.2 KiB
C++
Raw Normal View History

#include <Storages/ConstraintsDescription.h>
#include <Interpreters/ExpressionAnalyzer.h>
#include <Interpreters/TreeRewriter.h>
#include <Parsers/formatAST.h>
#include <Parsers/ParserCreateQuery.h>
#include <Parsers/parseQuery.h>
#include <Parsers/ASTExpressionList.h>
2021-04-03 12:12:45 +00:00
#include <Parsers/ASTFunction.h>
#include <Core/Defines.h>
namespace DB
{
2021-05-06 08:29:24 +00:00
namespace ErrorCodes
{
extern const int LOGICAL_ERROR;
}
String ConstraintsDescription::toString() const
{
if (constraints.empty())
return {};
ASTExpressionList list;
for (const auto & constraint : constraints)
list.children.push_back(constraint);
return serializeAST(list, true);
}
ConstraintsDescription ConstraintsDescription::parse(const String & str)
{
if (str.empty())
return {};
ConstraintsDescription res;
ParserConstraintDeclarationList parser;
ASTPtr list = parseQuery(parser, str, 0, DBMS_DEFAULT_MAX_PARSER_DEPTH);
for (const auto & constraint : list->children)
2020-05-12 11:26:44 +00:00
res.constraints.push_back(constraint);
return res;
}
2021-01-04 20:55:32 +00:00
ASTs ConstraintsDescription::filterConstraints(ConstraintType selection) const
2021-01-03 15:02:00 +00:00
{
2021-01-04 20:55:32 +00:00
const auto ast_to_decr_constraint_type = [](ASTConstraintDeclaration::Type constraint_type) -> UInt32
{
switch (constraint_type)
{
case ASTConstraintDeclaration::Type::CHECK:
return static_cast<UInt32>(ConstraintType::CHECK);
case ASTConstraintDeclaration::Type::ASSUME:
return static_cast<UInt32>(ConstraintType::ASSUME);
}
2021-05-04 18:43:58 +00:00
throw Exception("Unknown constraint type.", ErrorCodes::LOGICAL_ERROR);
2021-01-04 20:55:32 +00:00
};
2021-01-03 15:02:00 +00:00
ASTs res;
res.reserve(constraints.size());
for (const auto & constraint : constraints)
{
2021-05-04 18:43:58 +00:00
if ((ast_to_decr_constraint_type(constraint->as<ASTConstraintDeclaration>()->type) & static_cast<UInt32>(selection)) != 0)
{
2021-01-03 15:02:00 +00:00
res.push_back(constraint);
}
}
return res;
}
2021-04-26 14:19:18 +00:00
std::vector<std::vector<CNFQuery::AtomicFormula>> ConstraintsDescription::buildConstraintData() const
2021-04-03 12:12:45 +00:00
{
std::vector<std::vector<CNFQuery::AtomicFormula>> constraint_data;
for (const auto & constraint : filterConstraints(ConstraintsDescription::ConstraintType::ALWAYS_TRUE))
{
const auto cnf = TreeCNFConverter::toCNF(constraint->as<ASTConstraintDeclaration>()->expr->ptr())
.pullNotOutFunctions(); /// TODO: move prepare stage to ConstraintsDescription
for (const auto & group : cnf.getStatements())
constraint_data.emplace_back(std::begin(group), std::end(group));
}
return constraint_data;
}
std::vector<CNFQuery::AtomicFormula> ConstraintsDescription::getAtomicConstraintData() const
{
std::vector<CNFQuery::AtomicFormula> constraint_data;
for (const auto & constraint : filterConstraints(ConstraintsDescription::ConstraintType::ALWAYS_TRUE))
{
2021-04-10 20:46:53 +00:00
Poco::Logger::get("atomic_formula: initial:").information(constraint->as<ASTConstraintDeclaration>()->expr->ptr()->dumpTree());
2021-04-03 12:12:45 +00:00
const auto cnf = TreeCNFConverter::toCNF(constraint->as<ASTConstraintDeclaration>()->expr->ptr())
2021-05-05 11:17:49 +00:00
.pullNotOutFunctions();
2021-05-04 18:43:58 +00:00
for (const auto & group : cnf.getStatements())
{
2021-04-03 12:12:45 +00:00
if (group.size() == 1)
constraint_data.push_back(*group.begin());
}
}
return constraint_data;
}
2021-04-26 14:19:18 +00:00
std::unique_ptr<ComparisonGraph> ConstraintsDescription::buildGraph() const
2021-04-03 12:12:45 +00:00
{
static const std::set<std::string> relations = {
"equals", "less", "lessOrEquals", "greaterOrEquals", "greater"};
std::vector<ASTPtr> constraints_for_graph;
auto atomic_formulas = getAtomicConstraintData();
2021-05-06 08:29:24 +00:00
for (const auto & atomic_formula : atomic_formulas)
2021-04-03 12:12:45 +00:00
{
2021-04-10 20:46:53 +00:00
Poco::Logger::get("atomic_formula: before:").information(atomic_formula.ast->dumpTree() + " " + std::to_string(atomic_formula.negative));
2021-05-06 08:29:24 +00:00
CNFQuery::AtomicFormula atom{atomic_formula.negative, atomic_formula.ast->clone()};
pushNotIn(atom);
auto * func = atom.ast->as<ASTFunction>();
2021-04-03 12:12:45 +00:00
if (func && relations.count(func->name))
{
2021-05-06 08:29:24 +00:00
if (atom.negative)
2021-04-03 12:12:45 +00:00
throw Exception(": ", ErrorCodes::LOGICAL_ERROR);
2021-05-06 08:29:24 +00:00
Poco::Logger::get("atomic_formula: after:").information(atom.ast->dumpTree() + " " + std::to_string(atom.negative));
constraints_for_graph.push_back(atom.ast);
2021-04-03 12:12:45 +00:00
}
}
2021-04-26 14:19:18 +00:00
return std::make_unique<ComparisonGraph>(constraints_for_graph);
2021-04-03 12:12:45 +00:00
}
ConstraintsExpressions ConstraintsDescription::getExpressions(const DB::ContextPtr context,
2019-05-25 14:07:45 +00:00
const DB::NamesAndTypesList & source_columns_) const
{
ConstraintsExpressions res;
res.reserve(constraints.size());
for (const auto & constraint : constraints)
{
2020-05-12 16:38:11 +00:00
auto * constraint_ptr = constraint->as<ASTConstraintDeclaration>();
2021-01-03 15:02:00 +00:00
if (constraint_ptr->type == ASTConstraintDeclaration::Type::CHECK)
{
// TreeRewriter::analyze has query as non-const argument so to avoid accidental query changes we clone it
ASTPtr expr = constraint_ptr->expr->clone();
auto syntax_result = TreeRewriter(context).analyze(expr, source_columns_);
res.push_back(ExpressionAnalyzer(constraint_ptr->expr->clone(), syntax_result, context).getActions(false));
}
2019-05-25 14:07:45 +00:00
}
return res;
}
2021-04-26 14:19:18 +00:00
const ComparisonGraph & ConstraintsDescription::getGraph() const
{
return *graph;
}
const std::vector<std::vector<CNFQuery::AtomicFormula>> & ConstraintsDescription::getConstraintData() const
{
return cnf_constraints;
}
const std::vector<ASTPtr> & ConstraintsDescription::getConstraints() const
{
return constraints;
}
2021-05-05 11:17:49 +00:00
std::optional<ConstraintsDescription::AtomIds> ConstraintsDescription::getAtomIds(const ASTPtr & ast) const
{
const auto hash = ast->getTreeHash();
if (ast_to_atom_ids.contains(hash))
return ast_to_atom_ids.at(hash);
return std::nullopt;
}
std::vector<CNFQuery::AtomicFormula> ConstraintsDescription::getAtomsById(const ConstraintsDescription::AtomIds & ids) const
{
std::vector<CNFQuery::AtomicFormula> result;
for (const auto & id : ids)
result.push_back(cnf_constraints[id.and_group][id.atom]);
return result;
}
2021-04-26 14:19:18 +00:00
void ConstraintsDescription::updateConstraints(const std::vector<ASTPtr> & constraints_)
{
constraints = constraints_;
update();
}
2020-06-05 17:29:40 +00:00
ConstraintsDescription::ConstraintsDescription(const ConstraintsDescription & other)
{
constraints.reserve(other.constraints.size());
for (const auto & constraint : other.constraints)
constraints.emplace_back(constraint->clone());
2021-04-26 14:19:18 +00:00
update();
2020-06-05 17:29:40 +00:00
}
ConstraintsDescription & ConstraintsDescription::operator=(const ConstraintsDescription & other)
{
constraints.resize(other.constraints.size());
for (size_t i = 0; i < constraints.size(); ++i)
constraints[i] = other.constraints[i]->clone();
2021-04-26 14:19:18 +00:00
update();
2020-06-05 17:29:40 +00:00
return *this;
}
2021-04-26 14:19:18 +00:00
void ConstraintsDescription::update()
{
cnf_constraints = buildConstraintData();
2021-05-05 11:17:49 +00:00
ast_to_atom_ids.clear();
for (size_t i = 0; i < cnf_constraints.size(); ++i)
{
for (size_t j = 0; j < cnf_constraints[i].size(); ++j)
{
ast_to_atom_ids[cnf_constraints[i][j].ast->getTreeHash()].push_back({i, j});
}
}
2021-04-26 14:19:18 +00:00
graph = buildGraph();
}
}