// ClickHouse/src/Dictionaries/ExternalQueryBuilder.cpp
// (Source-viewer header residue: 426 lines, 11 KiB, C++.)

#include "ExternalQueryBuilder.h"
#include <IO/WriteBuffer.h>
#include <IO/WriteBufferFromString.h>
#include <IO/WriteHelpers.h>
#include <boost/range/join.hpp>
#include "DictionaryStructure.h"
#include "writeParenthesisedString.h"
// 2016-12-08 02:49:04 +00:00 (blame-view timestamp, not part of the code)
namespace DB
{
/// Error codes thrown by the query builder. Only declared here (`extern`);
/// the definitions live outside this file.
namespace ErrorCodes
{
    extern const int UNSUPPORTED_METHOD;
    extern const int LOGICAL_ERROR;
}
/// Initialises the builder's members from the given arguments:
///  - dict_struct_   : description of the dictionary (id / key / range / attributes);
///  - db_, schema_   : optional qualifiers written before the table name when non-empty;
///  - table_         : name of the table to read from;
///  - where_         : optional filter text, written verbatim into the WHERE clause;
///  - quoting_style_ : how identifiers are quoted in the generated queries.
ExternalQueryBuilder::ExternalQueryBuilder(
    const DictionaryStructure & dict_struct_,
    const std::string & db_,
    const std::string & schema_,
    const std::string & table_,
    const std::string & where_,
    IdentifierQuotingStyle quoting_style_)
    : dict_struct(dict_struct_)
    , db(db_)
    , schema(schema_)
    , table(table_)
    , where(where_)
    , quoting_style(quoting_style_)
{
}
// 2016-12-08 02:49:04 +00:00 (blame-view timestamp, not part of the code)
/// Writes identifier `s` into `out`, quoted according to `quoting_style`.
/// With IdentifierQuotingStyle::None the identifier is written as is.
void ExternalQueryBuilder::writeQuoted(const std::string & s, WriteBuffer & out) const
{
    switch (quoting_style)
    {
        case IdentifierQuotingStyle::None:
            writeString(s, out);
            return;

        case IdentifierQuotingStyle::Backticks:
            writeBackQuotedString(s, out);
            return;

        case IdentifierQuotingStyle::DoubleQuotes:
            writeDoubleQuotedString(s, out);
            return;

        case IdentifierQuotingStyle::BackticksMySQL:
            writeBackQuotedStringMySQL(s, out);
            return;
    }
}
// 2016-12-08 02:49:04 +00:00 (blame-view timestamp, not part of the code)
std::string ExternalQueryBuilder::composeLoadAllQuery() const
{
2017-07-31 21:39:24 +00:00
WriteBufferFromOwnString out;
2020-05-26 19:21:18 +00:00
composeLoadAllQuery(out);
writeChar(';', out);
return out.str();
}
/// Writes the "load all rows" query into `out`, without a trailing ';':
///
///   SELECT <id>[, <range_min>, <range_max>] | <key_1>, ..., <key_n>
///          , <attribute_1>, ..., <attribute_m>
///   FROM [db.][schema.]table
///   [WHERE <where>]
///
/// Every selected column is written as `(expression) AS name` when it has a
/// non-empty expression and as plain `name` otherwise. Names are quoted via writeQuoted().
/// The range columns are emitted only for a simple `id` key and only when both
/// `range_min` and `range_max` are present.
void ExternalQueryBuilder::composeLoadAllQuery(WriteBuffer & out) const
{
    /// Writes a single SELECT-list item for anything that has `expression` and `name`.
    const auto write_column = [&](const auto & column)
    {
        if (!column.expression.empty())
        {
            writeParenthesisedString(column.expression, out);
            writeString(" AS ", out);
        }

        writeQuoted(column.name, out);
    };

    writeString("SELECT ", out);

    if (dict_struct.id)
    {
        write_column(*dict_struct.id);

        if (dict_struct.range_min && dict_struct.range_max)
        {
            writeString(", ", out);
            write_column(*dict_struct.range_min);

            writeString(", ", out);
            write_column(*dict_struct.range_max);
        }
    }
    else if (dict_struct.key)
    {
        auto first = true;
        for (const auto & key : *dict_struct.key)
        {
            if (!first)
                writeString(", ", out);

            first = false;

            write_column(key);
        }
    }

    /// Attributes always follow the key columns, hence the unconditional leading comma.
    for (const auto & attr : dict_struct.attributes)
    {
        writeString(", ", out);
        write_column(attr);
    }

    writeString(" FROM ", out);
    if (!db.empty())
    {
        writeQuoted(db, out);
        writeChar('.', out);
    }
    if (!schema.empty())
    {
        writeQuoted(schema, out);
        writeChar('.', out);
    }

    writeQuoted(table, out);

    /// The filter is written verbatim, it is neither quoted nor parenthesised.
    if (!where.empty())
    {
        writeString(" WHERE ", out);
        writeString(where, out);
    }
}
std::string ExternalQueryBuilder::composeUpdateQuery(const std::string & update_field, const std::string & time_point) const
{
2020-05-26 19:21:18 +00:00
WriteBufferFromOwnString out;
composeLoadAllQuery(out);
if (!where.empty())
2020-05-26 19:21:18 +00:00
writeString(" AND ", out);
else
2020-05-26 19:21:18 +00:00
writeString(" WHERE ", out);
2020-07-10 13:03:36 +00:00
writeString(update_field, out);
2020-05-26 19:21:18 +00:00
writeString(" >= '", out);
writeString(time_point, out);
writeChar('\'', out);
2020-05-26 19:21:18 +00:00
writeChar(';', out);
return out.str();
}
// 2016-12-08 02:49:04 +00:00 (blame-view timestamp, not part of the code)
std::string ExternalQueryBuilder::composeLoadIdsQuery(const std::vector<UInt64> & ids)
{
if (!dict_struct.id)
2021-04-10 18:48:36 +00:00
throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "Simple key required for method");
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
WriteBufferFromOwnString out;
writeString("SELECT ", out);
2016-12-08 02:49:04 +00:00
if (!dict_struct.id->expression.empty())
{
writeParenthesisedString(dict_struct.id->expression, out);
2017-07-31 21:39:24 +00:00
writeString(" AS ", out);
}
2016-12-08 02:49:04 +00:00
writeQuoted(dict_struct.id->name, out);
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
for (const auto & attr : dict_struct.attributes)
{
writeString(", ", out);
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
if (!attr.expression.empty())
{
2017-07-31 21:39:24 +00:00
writeParenthesisedString(attr.expression, out);
writeString(" AS ", out);
}
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
writeQuoted(attr.name, out);
}
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
writeString(" FROM ", out);
if (!db.empty())
{
writeQuoted(db, out);
writeChar('.', out);
}
if (!schema.empty())
{
writeQuoted(schema, out);
writeChar('.', out);
}
2017-07-31 21:39:24 +00:00
writeQuoted(table, out);
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
writeString(" WHERE ", out);
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
if (!where.empty())
{
writeString(where, out);
writeString(" AND ", out);
}
2016-12-08 02:49:04 +00:00
writeQuoted(dict_struct.id->name, out);
2017-07-31 21:39:24 +00:00
writeString(" IN (", out);
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
auto first = true;
for (const auto id : ids)
{
if (!first)
writeString(", ", out);
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
first = false;
writeString(DB::toString(id), out);
}
2016-12-08 02:49:04 +00:00
2017-07-31 21:39:24 +00:00
writeString(");", out);
return out.str();
2016-12-08 02:49:04 +00:00
}
std::string ExternalQueryBuilder::composeLoadKeysQuery(
const Columns & key_columns, const std::vector<size_t> & requested_rows, LoadKeysMethod method, size_t partition_key_prefix)
2016-12-08 02:49:04 +00:00
{
if (!dict_struct.key)
2021-04-10 18:48:36 +00:00
throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "Composite key required for method");
if (key_columns.size() != dict_struct.key->size())
2021-04-10 18:48:36 +00:00
throw Exception(ErrorCodes::LOGICAL_ERROR, "The size of key_columns does not equal to the size of dictionary key");
2017-07-31 21:39:24 +00:00
WriteBufferFromOwnString out;
writeString("SELECT ", out);
2017-07-31 21:39:24 +00:00
auto first = true;
for (const auto & key_or_attribute : boost::join(*dict_struct.key, dict_struct.attributes))
{
2017-07-31 21:39:24 +00:00
if (!first)
writeString(", ", out);
2017-07-31 21:39:24 +00:00
first = false;
2017-07-31 21:39:24 +00:00
if (!key_or_attribute.expression.empty())
{
2017-07-31 21:39:24 +00:00
writeParenthesisedString(key_or_attribute.expression, out);
writeString(" AS ", out);
}
2017-07-31 21:39:24 +00:00
writeQuoted(key_or_attribute.name, out);
}
2017-07-31 21:39:24 +00:00
writeString(" FROM ", out);
if (!db.empty())
{
writeQuoted(db, out);
writeChar('.', out);
}
if (!schema.empty())
{
writeQuoted(schema, out);
writeChar('.', out);
}
2017-07-31 21:39:24 +00:00
writeQuoted(table, out);
2017-07-31 21:39:24 +00:00
writeString(" WHERE ", out);
2017-07-31 21:39:24 +00:00
if (!where.empty())
{
2020-06-03 15:07:37 +00:00
if (method != CASSANDRA_SEPARATE_PARTITION_KEY)
writeString("(", out);
2017-07-31 21:39:24 +00:00
writeString(where, out);
2020-06-03 15:07:37 +00:00
if (method != CASSANDRA_SEPARATE_PARTITION_KEY)
writeString(") AND (", out);
else
writeString(" AND ", out);
2017-07-31 21:39:24 +00:00
}
2017-07-31 21:39:24 +00:00
if (method == AND_OR_CHAIN)
{
first = true;
for (const auto row : requested_rows)
{
if (!first)
writeString(" OR ", out);
2017-07-31 21:39:24 +00:00
first = false;
writeString("(", out);
composeKeyCondition(key_columns, row, out, 0, key_columns.size());
writeString(")", out);
}
2017-07-31 21:39:24 +00:00
}
else if (method == IN_WITH_TUPLES)
2017-07-31 21:39:24 +00:00
{
composeInWithTuples(key_columns, requested_rows, out, 0, key_columns.size());
}
else /* if (method == CASSANDRA_SEPARATE_PARTITION_KEY) */
{
/// CQL does not allow using OR conditions
/// and does not allow using multi-column IN expressions with partition key columns.
/// So we have to use multiple queries with conditions like
/// (partition_key_1 = val1 AND partition_key_2 = val2 ...) AND (clustering_key_1, ...) IN ((val3, ...), ...)
/// for each partition key.
/// `partition_key_prefix` is a number of columns from partition key.
/// All `requested_rows` must have the same values of partition key.
composeKeyCondition(key_columns, requested_rows.at(0), out, 0, partition_key_prefix);
if (partition_key_prefix && partition_key_prefix < key_columns.size())
writeString(" AND ", out);
if (partition_key_prefix < key_columns.size())
composeInWithTuples(key_columns, requested_rows, out, partition_key_prefix, key_columns.size());
}
2020-06-03 15:07:37 +00:00
if (!where.empty() && method != CASSANDRA_SEPARATE_PARTITION_KEY)
2017-07-31 21:39:24 +00:00
{
writeString(")", out);
}
writeString(";", out);
return out.str();
2016-12-08 02:49:04 +00:00
}
void ExternalQueryBuilder::composeKeyCondition(const Columns & key_columns, const size_t row, WriteBuffer & out,
size_t beg, size_t end) const
2016-12-08 02:49:04 +00:00
{
auto first = true;
2021-06-15 19:55:21 +00:00
for (size_t i = beg; i < end; ++i)
{
if (!first)
writeString(" AND ", out);
2016-12-08 02:49:04 +00:00
first = false;
2016-12-08 02:49:04 +00:00
const auto & key_description = (*dict_struct.key)[i];
2016-12-08 02:49:04 +00:00
/// key_i=value_i
2020-05-26 19:21:18 +00:00
writeQuoted(key_description.name, out);
writeString("=", out);
2021-06-12 10:53:03 +00:00
key_description.type_serialization->serializeTextQuoted(*key_columns[i], row, out, format_settings);
}
}
/// Writes `(key_beg, ..., key_{end-1}) IN ((v, ...), (v, ...), ...)` into `out`:
/// the tuple of key names for indices [beg, end) followed by one value tuple
/// per entry of `requested_rows`, separated by ", ".
void ExternalQueryBuilder::composeInWithTuples(const Columns & key_columns, const std::vector<size_t> & requested_rows,
                                               WriteBuffer & out, size_t beg, size_t end)
{
    composeKeyTupleDefinition(out, beg, end);
    writeString(" IN (", out);

    bool first = true;
    for (const auto row : requested_rows)
    {
        if (!first)
            writeString(", ", out);

        first = false;
        composeKeyTuple(key_columns, row, out, beg, end);
    }

    writeString(")", out);
}
/// Writes the parenthesised, comma-separated list of quoted key names for key
/// indices [beg, end) into `out`, e.g. `(key_1, key_2)`. An empty range yields `()`.
/// Throws UNSUPPORTED_METHOD when the dictionary has no composite key.
void ExternalQueryBuilder::composeKeyTupleDefinition(WriteBuffer & out, size_t beg, size_t end) const
{
    if (!dict_struct.key)
        throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "Composite key required for method");

    writeChar('(', out);

    auto first = true;
    for (size_t i = beg; i < end; ++i)
    {
        if (!first)
            writeString(", ", out);

        first = false;
        writeQuoted((*dict_struct.key)[i].name, out);
    }

    writeChar(')', out);
}
void ExternalQueryBuilder::composeKeyTuple(const Columns & key_columns, const size_t row, WriteBuffer & out, size_t beg, size_t end) const
2016-12-08 02:49:04 +00:00
{
writeString("(", out);
2016-12-08 02:49:04 +00:00
auto first = true;
2021-06-15 19:55:21 +00:00
for (size_t i = beg; i < end; ++i)
{
if (!first)
writeString(", ", out);
2016-12-08 02:49:04 +00:00
first = false;
2021-06-12 10:53:03 +00:00
auto serialization = (*dict_struct.key)[i].type_serialization;
2021-06-09 20:51:08 +00:00
serialization->serializeTextQuoted(*key_columns[i], row, out, format_settings);
}
2016-12-08 02:49:04 +00:00
writeString(")", out);
2016-12-08 02:49:04 +00:00
}
}