2017-04-01 09:19:00 +00:00
|
|
|
#include <Common/formatReadable.h>
|
2019-10-07 18:56:03 +00:00
|
|
|
#include <Common/PODArray.h>
|
2017-07-13 20:58:19 +00:00
|
|
|
#include <Common/typeid_cast.h>
|
2020-08-18 21:41:01 +00:00
|
|
|
#include <Common/ThreadProfileEvents.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
|
|
|
|
#include <IO/ConcatReadBuffer.h>
|
|
|
|
#include <IO/WriteBufferFromFile.h>
|
2018-11-30 15:36:41 +00:00
|
|
|
#include <IO/WriteBufferFromVector.h>
|
|
|
|
#include <IO/LimitReadBuffer.h>
|
|
|
|
#include <IO/copyData.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
|
|
|
|
#include <DataStreams/BlockIO.h>
|
|
|
|
#include <DataStreams/copyData.h>
|
2019-01-23 14:48:50 +00:00
|
|
|
#include <DataStreams/IBlockInputStream.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <DataStreams/InputStreamFromASTInsertQuery.h>
|
|
|
|
#include <DataStreams/CountingBlockOutputStream.h>
|
|
|
|
|
2020-12-04 02:15:44 +00:00
|
|
|
#include <Parsers/ASTIdentifier.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Parsers/ASTInsertQuery.h>
|
2020-12-04 02:15:44 +00:00
|
|
|
#include <Parsers/ASTLiteral.h>
|
2020-05-21 18:01:25 +00:00
|
|
|
#include <Parsers/ASTSelectQuery.h>
|
2020-12-02 12:08:03 +00:00
|
|
|
#include <Parsers/ASTDropQuery.h>
|
|
|
|
#include <Parsers/ASTCreateQuery.h>
|
|
|
|
#include <Parsers/ASTRenameQuery.h>
|
|
|
|
#include <Parsers/ASTAlterQuery.h>
|
2020-11-02 19:23:26 +00:00
|
|
|
#include <Parsers/ASTSelectWithUnionQuery.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Parsers/ASTShowProcesslistQuery.h>
|
2020-06-15 20:01:58 +00:00
|
|
|
#include <Parsers/ASTWatchQuery.h>
|
|
|
|
#include <Parsers/Lexer.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
|
2020-12-04 02:15:44 +00:00
|
|
|
#if !defined(ARCADIA_BUILD)
|
|
|
|
# include <Parsers/New/parseQuery.h> // Y_IGNORE
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include <Parsers/parseQuery.h>
|
|
|
|
#include <Parsers/ParserQuery.h>
|
2020-12-02 12:08:03 +00:00
|
|
|
#include <Parsers/queryNormalization.h>
|
2020-12-04 02:15:44 +00:00
|
|
|
#include <Parsers/queryToString.h>
|
|
|
|
|
2019-05-28 18:30:10 +00:00
|
|
|
#include <Storages/StorageInput.h>
|
|
|
|
|
2020-03-07 17:37:38 +00:00
|
|
|
#include <Access/EnabledQuota.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Interpreters/InterpreterFactory.h>
|
|
|
|
#include <Interpreters/ProcessList.h>
|
2020-10-22 16:47:20 +00:00
|
|
|
#include <Interpreters/OpenTelemetrySpanLog.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Interpreters/QueryLog.h>
|
2019-01-23 19:23:37 +00:00
|
|
|
#include <Interpreters/InterpreterSetQuery.h>
|
2020-10-08 09:06:04 +00:00
|
|
|
#include <Interpreters/ApplyWithGlobalVisitor.h>
|
2019-05-18 21:07:23 +00:00
|
|
|
#include <Interpreters/ReplaceQueryParameterVisitor.h>
|
2020-12-18 06:54:38 +00:00
|
|
|
#include <Interpreters/SelectQueryOptions.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Interpreters/executeQuery.h>
|
2020-05-20 20:16:32 +00:00
|
|
|
#include <Interpreters/Context.h>
|
2019-07-19 07:44:18 +00:00
|
|
|
#include <Common/ProfileEvents.h>
|
2019-07-19 13:50:11 +00:00
|
|
|
|
2019-04-29 15:01:53 +00:00
|
|
|
#include <Interpreters/DNSCacheUpdater.h>
|
2019-09-06 17:48:27 +00:00
|
|
|
#include <Common/SensitiveDataMasker.h>
|
2011-10-30 11:30:52 +00:00
|
|
|
|
2019-03-26 18:28:37 +00:00
|
|
|
#include <Processors/Transforms/LimitsCheckingTransform.h>
|
2019-04-12 13:56:48 +00:00
|
|
|
#include <Processors/Transforms/MaterializingTransform.h>
|
2019-03-26 18:28:37 +00:00
|
|
|
#include <Processors/Formats/IOutputFormat.h>
|
2011-10-30 11:30:52 +00:00
|
|
|
|
2020-03-28 03:02:26 +00:00
|
|
|
|
2019-06-20 07:17:21 +00:00
|
|
|
namespace ProfileEvents
|
|
|
|
{
|
|
|
|
extern const Event QueryMaskingRulesMatch;
|
2020-05-21 18:01:25 +00:00
|
|
|
extern const Event FailedQuery;
|
|
|
|
extern const Event FailedInsertQuery;
|
|
|
|
extern const Event FailedSelectQuery;
|
2020-08-04 16:14:15 +00:00
|
|
|
extern const Event QueryTimeMicroseconds;
|
|
|
|
extern const Event SelectQueryTimeMicroseconds;
|
|
|
|
extern const Event InsertQueryTimeMicroseconds;
|
2019-06-20 07:17:21 +00:00
|
|
|
}
|
|
|
|
|
2011-10-30 11:30:52 +00:00
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2016-01-11 21:46:36 +00:00
|
|
|
/// Error codes referenced in this file; declared only, the values are defined elsewhere.
namespace ErrorCodes
{
    extern const int INTO_OUTFILE_NOT_ALLOWED;
    extern const int QUERY_WAS_CANCELLED;
}
|
|
|
|
|
2011-10-30 11:30:52 +00:00
|
|
|
|
2018-03-11 00:15:26 +00:00
|
|
|
static void checkASTSizeLimits(const IAST & ast, const Settings & settings)
|
2012-12-26 20:29:28 +00:00
|
|
|
{
|
2018-03-11 00:15:26 +00:00
|
|
|
if (settings.max_ast_depth)
|
|
|
|
ast.checkDepth(settings.max_ast_depth);
|
|
|
|
if (settings.max_ast_elements)
|
|
|
|
ast.checkSize(settings.max_ast_elements);
|
2012-12-26 20:29:28 +00:00
|
|
|
}
|
2014-06-26 00:58:14 +00:00
|
|
|
|
2020-06-15 20:01:58 +00:00
|
|
|
|
2016-08-16 20:33:00 +00:00
|
|
|
/// Produces a variant of the query text that is convenient for the text log:
///  - every whitespace token (including line breaks) is replaced with a single space;
///  - all other tokens are copied verbatim, so line breaks inside them
///    (e.g. multiline string literals) are preserved;
///  - a line break that directly follows a comment is kept, because the comment
///    may be a single-line one and joining would swallow the rest of the query.
static String joinLines(const String & query)
{
    String joined;

    const char * const query_begin = query.data();
    const char * const query_end = query_begin + query.size();

    Lexer lexer(query_begin, query_end);

    for (Token token = lexer.nextToken(); !token.isEnd(); token = lexer.nextToken())
    {
        if (token.type == TokenType::Whitespace)
        {
            joined += ' ';
            continue;
        }

        /// Any non-whitespace token goes to the output unchanged.
        joined.append(token.begin, token.end);

        /// Keep the line break that terminates a comment.
        const bool is_comment = token.type == TokenType::Comment;
        if (is_comment && token.end < query_end && *token.end == '\n')
            joined += '\n';
    }

    return joined;
}
|
|
|
|
|
|
|
|
|
2019-06-20 07:17:21 +00:00
|
|
|
/// Returns the query text in the form that may be written to logs:
/// sensitive data is wiped (if a masker is configured) and the result is
/// truncated to `log_queries_cut_to_length` bytes.
static String prepareQueryForLogging(const String & query, Context & context)
{
    String masked_query = query;

    /// Masking must happen before truncation; otherwise a partially cut secret
    /// (e.g. a credit card number without its last digit) could slip past the
    /// masking rules and end up in the log.
    if (auto * masker = SensitiveDataMasker::getInstance())
    {
        const auto matches = masker->wipeSensitiveData(masked_query);
        if (matches > 0)
            ProfileEvents::increment(ProfileEvents::QueryMaskingRulesMatch, matches);
    }

    return masked_query.substr(0, context.getSettingsRef().log_queries_cut_to_length);
}
|
|
|
|
|
|
|
|
|
2016-08-16 20:33:00 +00:00
|
|
|
/// Log query into text log (not into system table).
|
2019-03-04 18:28:42 +00:00
|
|
|
static void logQuery(const String & query, const Context & context, bool internal)
|
2015-06-17 21:34:15 +00:00
|
|
|
{
|
2019-03-04 18:28:42 +00:00
|
|
|
if (internal)
|
|
|
|
{
|
2020-05-30 21:57:37 +00:00
|
|
|
LOG_DEBUG(&Poco::Logger::get("executeQuery"), "(internal) {}", joinLines(query));
|
2019-03-04 18:28:42 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2020-09-08 13:19:27 +00:00
|
|
|
const auto & client_info = context.getClientInfo();
|
|
|
|
|
|
|
|
const auto & current_query_id = client_info.current_query_id;
|
|
|
|
const auto & initial_query_id = client_info.initial_query_id;
|
|
|
|
const auto & current_user = client_info.current_user;
|
2019-03-04 18:28:42 +00:00
|
|
|
|
2020-12-04 02:15:44 +00:00
|
|
|
LOG_DEBUG(&Poco::Logger::get("executeQuery"), "(from {}{}{}, using {} parser) {}",
|
2020-09-08 13:19:27 +00:00
|
|
|
client_info.current_address.toString(),
|
|
|
|
(current_user != "default" ? ", user: " + current_user : ""),
|
2020-05-23 21:41:35 +00:00
|
|
|
(!initial_query_id.empty() && current_query_id != initial_query_id ? ", initial_query_id: " + initial_query_id : std::string()),
|
2020-12-28 12:37:09 +00:00
|
|
|
(context.getSettingsRef().use_antlr_parser ? "new" : "old"),
|
2020-12-28 12:57:27 +00:00
|
|
|
(!context.getSettingsRef().log_comment.toString().empty()
|
|
|
|
&& context.getSettingsRef().log_comment.toString().length() <= context.getSettingsRef().max_query_size
|
2020-12-29 02:13:27 +00:00
|
|
|
? ", comment: " + context.getSettingsRef().log_comment.toString()
|
2020-12-28 12:37:09 +00:00
|
|
|
: std::string()),
|
2020-05-23 21:41:35 +00:00
|
|
|
joinLines(query));
|
2020-08-28 19:02:50 +00:00
|
|
|
|
2020-11-18 17:43:18 +00:00
|
|
|
if (client_info.client_trace_context.trace_id)
|
2020-09-08 13:19:27 +00:00
|
|
|
{
|
|
|
|
LOG_TRACE(&Poco::Logger::get("executeQuery"),
|
2020-11-18 17:43:18 +00:00
|
|
|
"OpenTelemetry traceparent '{}'",
|
|
|
|
client_info.client_trace_context.composeTraceparentHeader());
|
2020-09-08 13:19:27 +00:00
|
|
|
}
|
2019-03-04 18:28:42 +00:00
|
|
|
}
|
2016-08-16 20:33:00 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// Call this inside catch block.
|
|
|
|
static void setExceptionStackTrace(QueryLogElement & elem)
|
|
|
|
{
|
2019-10-10 16:30:33 +00:00
|
|
|
/// Disable memory tracker for stack trace.
|
|
|
|
/// Because if exception is "Memory limit (for query) exceed", then we probably can't allocate another one string.
|
2020-10-21 00:31:12 +00:00
|
|
|
MemoryTracker::BlockerInThread temporarily_disable_memory_tracker;
|
2019-10-10 16:30:33 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
try
|
|
|
|
{
|
|
|
|
throw;
|
|
|
|
}
|
2020-01-02 07:37:13 +00:00
|
|
|
catch (const std::exception & e)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2020-01-02 07:37:13 +00:00
|
|
|
elem.stack_trace = getExceptionStackTraceString(e);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
catch (...) {}
|
2016-08-16 20:33:00 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// Log exception (with query info) into text log (not into system table).
|
|
|
|
static void logException(Context & context, QueryLogElement & elem)
|
|
|
|
{
|
2020-05-23 21:41:35 +00:00
|
|
|
if (elem.stack_trace.empty())
|
2020-05-30 21:57:37 +00:00
|
|
|
LOG_ERROR(&Poco::Logger::get("executeQuery"), "{} (from {}) (in query: {})",
|
2020-05-23 21:41:35 +00:00
|
|
|
elem.exception, context.getClientInfo().current_address.toString(), joinLines(elem.query));
|
|
|
|
else
|
2020-05-30 21:57:37 +00:00
|
|
|
LOG_ERROR(&Poco::Logger::get("executeQuery"), "{} (from {}) (in query: {})"
|
2020-05-23 21:41:35 +00:00
|
|
|
", Stack trace (when copying this message, always include the lines below):\n\n{}",
|
|
|
|
elem.exception, context.getClientInfo().current_address.toString(), joinLines(elem.query), elem.stack_trace);
|
2015-06-17 21:34:15 +00:00
|
|
|
}
|
|
|
|
|
2020-09-15 06:29:49 +00:00
|
|
|
/// Converts a system clock time point to the number of whole microseconds since the clock's epoch.
inline UInt64 time_in_microseconds(std::chrono::time_point<std::chrono::system_clock> timepoint)
{
    const auto since_epoch = timepoint.time_since_epoch();
    const auto as_microseconds = std::chrono::duration_cast<std::chrono::microseconds>(since_epoch);
    return as_microseconds.count();
}
|
|
|
|
|
|
|
|
|
|
|
|
/// Converts a system clock time point to the number of whole seconds since the clock's epoch
/// (the sub-second part is truncated by duration_cast).
inline UInt64 time_in_seconds(std::chrono::time_point<std::chrono::system_clock> timepoint)
{
    const auto since_epoch = timepoint.time_since_epoch();
    const auto as_seconds = std::chrono::duration_cast<std::chrono::seconds>(since_epoch);
    return as_seconds.count();
}
|
2015-06-17 21:34:15 +00:00
|
|
|
|
2020-09-30 16:16:33 +00:00
|
|
|
static void onExceptionBeforeStart(const String & query_for_logging, Context & context, UInt64 current_time_us, ASTPtr ast)
|
2015-07-01 05:18:54 +00:00
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
/// Exception before the query execution.
|
2020-03-07 17:37:38 +00:00
|
|
|
if (auto quota = context.getQuota())
|
|
|
|
quota->used(Quota::ERRORS, 1, /* check_exceeded = */ false);
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2018-08-23 01:31:28 +00:00
|
|
|
const Settings & settings = context.getSettingsRef();
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
/// Log the start of query execution into the table if necessary.
|
2018-05-30 16:15:35 +00:00
|
|
|
QueryLogElement elem;
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2020-04-04 21:07:00 +00:00
|
|
|
elem.type = QueryLogElementType::EXCEPTION_BEFORE_START;
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2020-09-15 06:49:02 +00:00
|
|
|
// all callers to onExceptionBeforeStart method construct the timespec for event_time and
|
|
|
|
// event_time_microseconds from the same time point. So, it can be assumed that both of these
|
2020-10-27 11:04:03 +00:00
|
|
|
// times are equal up to the precision of a second.
|
2020-09-30 16:16:33 +00:00
|
|
|
elem.event_time = current_time_us / 1000000;
|
2020-10-01 15:41:48 +00:00
|
|
|
elem.event_time_microseconds = current_time_us;
|
2020-09-30 16:16:33 +00:00
|
|
|
elem.query_start_time = current_time_us / 1000000;
|
|
|
|
elem.query_start_time_microseconds = current_time_us;
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2020-07-22 04:00:16 +00:00
|
|
|
elem.current_database = context.getCurrentDatabase();
|
2019-06-20 07:17:21 +00:00
|
|
|
elem.query = query_for_logging;
|
2020-12-02 12:08:03 +00:00
|
|
|
elem.normalized_query_hash = normalizedQueryHash(query_for_logging);
|
|
|
|
|
|
|
|
// We don't calculate query_kind, databases, tables and columns when the query isn't able to start
|
|
|
|
|
2020-01-22 12:29:30 +00:00
|
|
|
elem.exception_code = getCurrentExceptionCode();
|
2018-05-30 16:15:35 +00:00
|
|
|
elem.exception = getCurrentExceptionMessage(false);
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2018-05-30 16:15:35 +00:00
|
|
|
elem.client_info = context.getClientInfo();
|
2016-10-24 21:40:39 +00:00
|
|
|
|
2020-12-29 02:13:27 +00:00
|
|
|
if (!settings.log_comment.toString().empty() && settings.log_comment.toString().length() <= settings.max_query_size)
|
2020-12-28 12:57:27 +00:00
|
|
|
elem.log_comment = settings.log_comment.toString();
|
|
|
|
|
2018-08-23 01:31:28 +00:00
|
|
|
if (settings.calculate_text_stack_trace)
|
|
|
|
setExceptionStackTrace(elem);
|
2018-05-30 16:15:35 +00:00
|
|
|
logException(context, elem);
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2018-06-19 20:30:35 +00:00
|
|
|
/// Update performance counters before logging to query_log
|
|
|
|
CurrentThread::finalizePerformanceCounters();
|
|
|
|
|
2020-10-29 19:28:46 +00:00
|
|
|
if (settings.log_queries && elem.type >= settings.log_queries_min_type && !settings.log_queries_min_query_duration_ms.totalMilliseconds())
|
2018-03-10 19:57:13 +00:00
|
|
|
if (auto query_log = context.getQueryLog())
|
|
|
|
query_log->add(elem);
|
2020-05-21 18:01:25 +00:00
|
|
|
|
2020-10-22 16:47:20 +00:00
|
|
|
if (auto opentelemetry_span_log = context.getOpenTelemetrySpanLog();
|
2020-11-18 17:43:18 +00:00
|
|
|
context.query_trace_context.trace_id
|
2020-10-22 16:47:20 +00:00
|
|
|
&& opentelemetry_span_log)
|
2020-08-27 18:44:20 +00:00
|
|
|
{
|
|
|
|
OpenTelemetrySpanLogElement span;
|
2020-11-18 17:43:18 +00:00
|
|
|
span.trace_id = context.query_trace_context.trace_id;
|
|
|
|
span.span_id = context.query_trace_context.span_id;
|
|
|
|
span.parent_span_id = context.getClientInfo().client_trace_context.span_id;
|
2020-08-27 18:44:20 +00:00
|
|
|
span.operation_name = "query";
|
2020-09-30 16:16:33 +00:00
|
|
|
span.start_time_us = current_time_us;
|
|
|
|
span.finish_time_us = current_time_us;
|
2020-08-27 18:44:20 +00:00
|
|
|
|
2020-11-12 23:27:18 +00:00
|
|
|
/// Keep values synchronized to type enum in QueryLogElement::createBlock.
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("clickhouse.query_status");
|
2020-08-27 18:44:20 +00:00
|
|
|
span.attribute_values.push_back("ExceptionBeforeStart");
|
|
|
|
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("db.statement");
|
2020-08-27 18:44:20 +00:00
|
|
|
span.attribute_values.push_back(elem.query);
|
|
|
|
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("clickhouse.query_id");
|
2020-08-27 18:44:20 +00:00
|
|
|
span.attribute_values.push_back(elem.client_info.current_query_id);
|
|
|
|
|
2020-11-18 17:43:18 +00:00
|
|
|
if (!context.query_trace_context.tracestate.empty())
|
2020-08-28 01:21:08 +00:00
|
|
|
{
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("clickhouse.tracestate");
|
2020-08-28 01:21:08 +00:00
|
|
|
span.attribute_values.push_back(
|
2020-11-18 17:43:18 +00:00
|
|
|
context.query_trace_context.tracestate);
|
2020-08-28 01:21:08 +00:00
|
|
|
}
|
|
|
|
|
2020-10-22 16:47:20 +00:00
|
|
|
opentelemetry_span_log->add(span);
|
2020-08-27 18:44:20 +00:00
|
|
|
}
|
|
|
|
|
2020-05-21 18:01:25 +00:00
|
|
|
ProfileEvents::increment(ProfileEvents::FailedQuery);
|
|
|
|
|
|
|
|
if (ast)
|
|
|
|
{
|
|
|
|
if (ast->as<ASTSelectQuery>() || ast->as<ASTSelectWithUnionQuery>())
|
|
|
|
{
|
|
|
|
ProfileEvents::increment(ProfileEvents::FailedSelectQuery);
|
|
|
|
}
|
|
|
|
else if (ast->as<ASTInsertQuery>())
|
|
|
|
{
|
|
|
|
ProfileEvents::increment(ProfileEvents::FailedInsertQuery);
|
|
|
|
}
|
|
|
|
}
|
2015-07-01 05:18:54 +00:00
|
|
|
}
|
|
|
|
|
2020-04-28 15:50:50 +00:00
|
|
|
/// Adjusts settings of `context` depending on the kind of the query.
/// Currently the only case is INSERT ... WATCH (an INSERT query whose `watch` part is set),
/// for which `output_format_enable_streaming` is turned on.
static void setQuerySpecificSettings(ASTPtr & ast, Context & context)
{
    auto * insert = dynamic_cast<ASTInsertQuery *>(ast.get());

    if (insert && insert->watch)
        context.setSetting("output_format_enable_streaming", 1);
}
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2015-06-18 02:11:05 +00:00
|
|
|
static std::tuple<ASTPtr, BlockIO> executeQueryImpl(
|
2017-07-10 03:41:02 +00:00
|
|
|
const char * begin,
|
|
|
|
const char * end,
|
2017-04-01 07:20:54 +00:00
|
|
|
Context & context,
|
|
|
|
bool internal,
|
2019-02-08 13:24:24 +00:00
|
|
|
QueryProcessingStage::Enum stage,
|
2019-09-02 15:19:01 +00:00
|
|
|
bool has_query_tail,
|
2020-05-18 13:55:07 +00:00
|
|
|
ReadBuffer * istr)
|
2015-06-18 00:27:25 +00:00
|
|
|
{
|
2020-09-30 16:16:33 +00:00
|
|
|
const auto current_time = std::chrono::system_clock::now();
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2019-10-29 10:27:19 +00:00
|
|
|
/// If we are already executing a query and it requires executing an internal query, then
|
|
|
|
/// don't replace thread context with given (it can be temporary). Otherwise, attach context to thread.
|
|
|
|
if (!internal)
|
|
|
|
{
|
|
|
|
context.makeQueryContext();
|
|
|
|
CurrentThread::attachQueryContext(context);
|
|
|
|
}
|
2018-03-02 05:44:17 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
const Settings & settings = context.getSettingsRef();
|
|
|
|
|
|
|
|
ASTPtr ast;
|
2019-01-18 16:30:35 +00:00
|
|
|
const char * query_end;
|
2017-07-28 18:43:40 +00:00
|
|
|
|
|
|
|
/// Don't limit the size of internal queries.
|
|
|
|
size_t max_query_size = 0;
|
2020-12-04 02:15:44 +00:00
|
|
|
if (!internal) max_query_size = settings.max_query_size;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-12-02 12:08:03 +00:00
|
|
|
String query_database;
|
|
|
|
String query_table;
|
2017-04-01 07:20:54 +00:00
|
|
|
try
|
|
|
|
{
|
2020-12-04 02:15:44 +00:00
|
|
|
#if !defined(ARCADIA_BUILD)
|
|
|
|
if (settings.use_antlr_parser)
|
|
|
|
{
|
|
|
|
ast = parseQuery(begin, end, max_query_size, settings.max_parser_depth);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
ParserQuery parser(end);
|
|
|
|
|
|
|
|
/// TODO: parser should fail early when max_query_size limit is reached.
|
|
|
|
ast = parseQuery(parser, begin, end, "", max_query_size, settings.max_parser_depth);
|
|
|
|
}
|
|
|
|
#else
|
|
|
|
ParserQuery parser(end);
|
|
|
|
|
|
|
|
/// TODO: parser should fail early when max_query_size limit is reached.
|
2020-01-14 11:11:01 +00:00
|
|
|
ast = parseQuery(parser, begin, end, "", max_query_size, settings.max_parser_depth);
|
2020-12-04 02:15:44 +00:00
|
|
|
#endif
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-11-02 19:23:26 +00:00
|
|
|
/// Interpret SETTINGS clauses as early as possible (before invoking the corresponding interpreter),
|
|
|
|
/// to allow settings to take effect.
|
|
|
|
if (const auto * select_query = ast->as<ASTSelectQuery>())
|
|
|
|
{
|
|
|
|
if (auto new_settings = select_query->settings())
|
|
|
|
InterpreterSetQuery(new_settings, context).executeForCurrentContext();
|
|
|
|
}
|
|
|
|
else if (const auto * select_with_union_query = ast->as<ASTSelectWithUnionQuery>())
|
|
|
|
{
|
|
|
|
if (!select_with_union_query->list_of_selects->children.empty())
|
|
|
|
{
|
2020-11-05 09:25:42 +00:00
|
|
|
// We might have an arbitrarily complex UNION tree, so just give
|
|
|
|
// up if the last first-order child is not a plain SELECT.
|
|
|
|
// It is flattened later, when we process UNION ALL/DISTINCT.
|
|
|
|
const auto * last_select = select_with_union_query->list_of_selects->children.back()->as<ASTSelectQuery>();
|
|
|
|
if (last_select && last_select->settings())
|
|
|
|
{
|
|
|
|
InterpreterSetQuery(last_select->settings(), context).executeForCurrentContext();
|
|
|
|
}
|
2020-11-02 19:23:26 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
else if (const auto * query_with_output = dynamic_cast<const ASTQueryWithOutput *>(ast.get()))
|
|
|
|
{
|
|
|
|
if (query_with_output->settings_ast)
|
|
|
|
InterpreterSetQuery(query_with_output->settings_ast, context).executeForCurrentContext();
|
|
|
|
}
|
|
|
|
|
2020-12-02 12:08:03 +00:00
|
|
|
if (const auto * query_with_table_output = dynamic_cast<const ASTQueryWithTableAndOutput *>(ast.get()))
|
|
|
|
{
|
|
|
|
query_database = query_with_table_output->database;
|
|
|
|
query_table = query_with_table_output->table;
|
|
|
|
}
|
|
|
|
|
2019-03-11 13:22:51 +00:00
|
|
|
auto * insert_query = ast->as<ASTInsertQuery>();
|
2019-03-29 14:50:48 +00:00
|
|
|
|
|
|
|
if (insert_query && insert_query->settings_ast)
|
|
|
|
InterpreterSetQuery(insert_query->settings_ast, context).executeForCurrentContext();
|
|
|
|
|
2019-01-18 16:30:35 +00:00
|
|
|
if (insert_query && insert_query->data)
|
2019-02-08 13:24:24 +00:00
|
|
|
{
|
2019-01-18 16:30:35 +00:00
|
|
|
query_end = insert_query->data;
|
2019-02-08 13:24:24 +00:00
|
|
|
insert_query->has_tail = has_query_tail;
|
|
|
|
}
|
2019-01-18 16:30:35 +00:00
|
|
|
else
|
2019-06-15 18:22:48 +00:00
|
|
|
{
|
2019-01-18 16:30:35 +00:00
|
|
|
query_end = end;
|
2019-06-15 18:22:48 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
catch (...)
|
|
|
|
{
|
2019-03-04 18:28:42 +00:00
|
|
|
/// Anyway log the query.
|
|
|
|
String query = String(begin, begin + std::min(end - begin, static_cast<ptrdiff_t>(max_query_size)));
|
2019-06-20 07:17:21 +00:00
|
|
|
|
|
|
|
auto query_for_logging = prepareQueryForLogging(query, context);
|
|
|
|
logQuery(query_for_logging, context, internal);
|
2019-03-04 18:28:42 +00:00
|
|
|
|
2020-09-15 06:49:02 +00:00
|
|
|
if (!internal)
|
|
|
|
{
|
2020-09-30 16:16:33 +00:00
|
|
|
onExceptionBeforeStart(query_for_logging, context, time_in_microseconds(current_time), ast);
|
2020-09-15 01:40:06 +00:00
|
|
|
}
|
2015-06-18 00:27:25 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
throw;
|
|
|
|
}
|
2015-06-18 00:27:25 +00:00
|
|
|
|
2020-04-28 15:50:50 +00:00
|
|
|
setQuerySpecificSettings(ast, context);
|
|
|
|
|
2019-01-18 16:30:35 +00:00
|
|
|
/// Copy query into string. It will be written to log and presented in processlist. If an INSERT query, string will not include data to insertion.
|
|
|
|
String query(begin, query_end);
|
2017-04-01 07:20:54 +00:00
|
|
|
BlockIO res;
|
2015-06-18 00:27:25 +00:00
|
|
|
|
2020-03-09 00:28:05 +00:00
|
|
|
String query_for_logging;
|
2019-06-20 07:17:21 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
try
|
|
|
|
{
|
2019-06-15 18:22:48 +00:00
|
|
|
/// Replace ASTQueryParameter with ASTLiteral for prepared statements.
|
2019-06-16 17:32:37 +00:00
|
|
|
if (context.hasQueryParameters())
|
|
|
|
{
|
|
|
|
ReplaceQueryParameterVisitor visitor(context.getQueryParameters());
|
|
|
|
visitor.visit(ast);
|
2020-10-20 18:10:24 +00:00
|
|
|
query = serializeAST(*ast);
|
2020-10-08 09:06:04 +00:00
|
|
|
}
|
2019-06-15 18:22:48 +00:00
|
|
|
|
2020-10-20 18:10:24 +00:00
|
|
|
/// MUST go before any modification (except for prepared statements,
|
|
|
|
/// since they substitute parameters and w/o them the query does not contain
|
|
|
|
/// parameters), to keep query as-is in query_log and server log.
|
|
|
|
query_for_logging = prepareQueryForLogging(query, context);
|
|
|
|
logQuery(query_for_logging, context, internal);
|
|
|
|
|
2020-10-08 09:06:04 +00:00
|
|
|
/// Propagate WITH statement to children ASTSelect.
|
|
|
|
if (settings.enable_global_with_statement)
|
|
|
|
{
|
|
|
|
ApplyWithGlobalVisitor().visit(ast);
|
|
|
|
query = serializeAST(*ast);
|
2020-10-20 18:10:24 +00:00
|
|
|
}
|
2015-06-18 00:27:25 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
/// Check the limits.
|
2018-03-11 00:15:26 +00:00
|
|
|
checkASTSizeLimits(*ast, settings);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
/// Put query to process list. But don't put SHOW PROCESSLIST query itself.
|
|
|
|
ProcessList::EntryPtr process_list_entry;
|
2019-03-11 13:22:51 +00:00
|
|
|
if (!internal && !ast->as<ASTShowProcesslistQuery>())
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2019-06-20 07:17:21 +00:00
|
|
|
/// processlist also has query masked now, to avoid secrets leaks through SHOW PROCESSLIST by other users.
|
|
|
|
process_list_entry = context.getProcessList().insert(query_for_logging, ast.get(), context);
|
2017-04-01 07:20:54 +00:00
|
|
|
context.setProcessListElement(&process_list_entry->get());
|
|
|
|
}
|
|
|
|
|
2018-06-01 15:32:27 +00:00
|
|
|
/// Load external tables if they were provided
|
|
|
|
context.initializeExternalTablesIfSet();
|
|
|
|
|
2019-05-28 18:30:10 +00:00
|
|
|
auto * insert_query = ast->as<ASTInsertQuery>();
|
2019-05-30 20:12:44 +00:00
|
|
|
if (insert_query && insert_query->select)
|
2019-05-28 18:30:10 +00:00
|
|
|
{
|
2019-05-30 20:12:44 +00:00
|
|
|
/// Prepare Input storage before executing interpreter if we already got a buffer with data.
|
2019-05-28 18:30:10 +00:00
|
|
|
if (istr)
|
|
|
|
{
|
2019-05-30 20:12:44 +00:00
|
|
|
ASTPtr input_function;
|
2019-05-30 21:33:06 +00:00
|
|
|
insert_query->tryFindInputFunction(input_function);
|
2019-05-30 20:12:44 +00:00
|
|
|
if (input_function)
|
|
|
|
{
|
|
|
|
StoragePtr storage = context.executeTableFunction(input_function);
|
|
|
|
auto & input_storage = dynamic_cast<StorageInput &>(*storage);
|
2020-06-16 15:51:29 +00:00
|
|
|
auto input_metadata_snapshot = input_storage.getInMemoryMetadataPtr();
|
|
|
|
BlockInputStreamPtr input_stream = std::make_shared<InputStreamFromASTInsertQuery>(
|
|
|
|
ast, istr, input_metadata_snapshot->getSampleBlock(), context, input_function);
|
2019-05-30 20:12:44 +00:00
|
|
|
input_storage.setInputStream(input_stream);
|
|
|
|
}
|
2019-05-28 18:30:10 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
/// reset Input callbacks if query is not INSERT SELECT
|
|
|
|
context.resetInputCallbacks();
|
|
|
|
|
2020-12-18 06:54:38 +00:00
|
|
|
auto interpreter = InterpreterFactory::get(ast, context, SelectQueryOptions(stage).setInternal(internal));
|
2019-03-26 18:28:37 +00:00
|
|
|
|
2020-03-07 17:37:38 +00:00
|
|
|
std::shared_ptr<const EnabledQuota> quota;
|
2019-11-11 01:11:32 +00:00
|
|
|
if (!interpreter->ignoreQuota())
|
|
|
|
{
|
|
|
|
quota = context.getQuota();
|
2020-03-07 17:37:38 +00:00
|
|
|
if (quota)
|
|
|
|
{
|
|
|
|
quota->used(Quota::QUERIES, 1);
|
|
|
|
quota->checkExceeded(Quota::ERRORS);
|
|
|
|
}
|
2019-11-11 01:11:32 +00:00
|
|
|
}
|
|
|
|
|
2020-09-15 10:40:39 +00:00
|
|
|
StreamLocalLimits limits;
|
2019-11-11 01:11:32 +00:00
|
|
|
if (!interpreter->ignoreLimits())
|
|
|
|
{
|
2020-09-14 14:13:58 +00:00
|
|
|
limits.mode = LimitsMode::LIMITS_CURRENT;
|
2019-11-11 01:11:32 +00:00
|
|
|
limits.size_limits = SizeLimits(settings.max_result_rows, settings.max_result_bytes, settings.result_overflow_mode);
|
|
|
|
}
|
|
|
|
|
2020-11-09 15:07:38 +00:00
|
|
|
{
|
2020-11-19 15:52:11 +00:00
|
|
|
OpenTelemetrySpanHolder span("IInterpreter::execute()");
|
2020-11-09 15:07:38 +00:00
|
|
|
res = interpreter->execute();
|
|
|
|
}
|
|
|
|
|
2020-05-28 08:24:59 +00:00
|
|
|
QueryPipeline & pipeline = res.pipeline;
|
|
|
|
bool use_processors = pipeline.initialized();
|
2019-03-26 18:28:37 +00:00
|
|
|
|
2020-04-22 06:01:33 +00:00
|
|
|
if (const auto * insert_interpreter = typeid_cast<const InterpreterInsertQuery *>(&*interpreter))
|
2019-07-17 18:30:17 +00:00
|
|
|
{
|
|
|
|
/// Save insertion table (not table function). TODO: support remote() table function.
|
2020-03-02 20:23:58 +00:00
|
|
|
auto table_id = insert_interpreter->getDatabaseTable();
|
|
|
|
if (!table_id.empty())
|
|
|
|
context.setInsertionTable(std::move(table_id));
|
2019-07-17 18:30:17 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
if (process_list_entry)
|
2018-11-01 14:56:37 +00:00
|
|
|
{
|
|
|
|
/// Query was killed before execution
|
|
|
|
if ((*process_list_entry)->isKilled())
|
|
|
|
throw Exception("Query '" + (*process_list_entry)->getInfo().client_info.current_query_id + "' is killed in pending state",
|
|
|
|
ErrorCodes::QUERY_WAS_CANCELLED);
|
2019-03-26 18:28:37 +00:00
|
|
|
else if (!use_processors)
|
2018-11-01 14:56:37 +00:00
|
|
|
(*process_list_entry)->setQueryStreams(res);
|
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
/// Hold element of process list till end of query execution.
|
|
|
|
res.process_list_entry = process_list_entry;
|
|
|
|
|
2019-03-26 18:28:37 +00:00
|
|
|
if (use_processors)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2019-01-23 14:48:50 +00:00
|
|
|
/// Limits on the result, the quota on the result, and also callback for progress.
|
|
|
|
/// Limits apply only to the final result.
|
2019-11-11 01:11:32 +00:00
|
|
|
pipeline.setProgressCallback(context.getProgressCallback());
|
|
|
|
pipeline.setProcessListElement(context.getProcessListElement());
|
2020-05-27 18:20:26 +00:00
|
|
|
if (stage == QueryProcessingStage::Complete && !pipeline.isCompleted())
|
2019-01-23 14:48:50 +00:00
|
|
|
{
|
2019-03-26 18:28:37 +00:00
|
|
|
pipeline.resize(1);
|
2019-04-05 11:34:11 +00:00
|
|
|
pipeline.addSimpleTransform([&](const Block & header)
|
|
|
|
{
|
2019-03-26 18:28:37 +00:00
|
|
|
auto transform = std::make_shared<LimitsCheckingTransform>(header, limits);
|
|
|
|
transform->setQuota(quota);
|
|
|
|
return transform;
|
|
|
|
});
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
}
|
2019-03-26 18:28:37 +00:00
|
|
|
else
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2019-11-11 01:11:32 +00:00
|
|
|
/// Limits on the result, the quota on the result, and also callback for progress.
|
|
|
|
/// Limits apply only to the final result.
|
2019-03-26 18:28:37 +00:00
|
|
|
if (res.in)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2019-03-26 18:28:37 +00:00
|
|
|
res.in->setProgressCallback(context.getProgressCallback());
|
|
|
|
res.in->setProcessListElement(context.getProcessListElement());
|
|
|
|
if (stage == QueryProcessingStage::Complete)
|
|
|
|
{
|
2019-11-11 01:11:32 +00:00
|
|
|
if (!interpreter->ignoreQuota())
|
|
|
|
res.in->setQuota(quota);
|
|
|
|
if (!interpreter->ignoreLimits())
|
|
|
|
res.in->setLimits(limits);
|
2019-03-26 18:28:37 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (res.out)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2020-04-22 06:01:33 +00:00
|
|
|
if (auto * stream = dynamic_cast<CountingBlockOutputStream *>(res.out.get()))
|
2019-03-26 18:28:37 +00:00
|
|
|
{
|
|
|
|
stream->setProcessListElement(context.getProcessListElement());
|
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Everything related to query log.
|
|
|
|
{
|
|
|
|
QueryLogElement elem;
|
|
|
|
|
2020-04-04 21:07:00 +00:00
|
|
|
elem.type = QueryLogElementType::QUERY_START;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-09-30 16:16:33 +00:00
|
|
|
elem.event_time = time_in_seconds(current_time);
|
2020-10-01 15:41:48 +00:00
|
|
|
elem.event_time_microseconds = time_in_microseconds(current_time);
|
2020-09-30 16:16:33 +00:00
|
|
|
elem.query_start_time = time_in_seconds(current_time);
|
|
|
|
elem.query_start_time_microseconds = time_in_microseconds(current_time);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-07-22 04:00:16 +00:00
|
|
|
elem.current_database = context.getCurrentDatabase();
|
2019-06-20 07:17:21 +00:00
|
|
|
elem.query = query_for_logging;
|
2020-12-02 12:08:03 +00:00
|
|
|
elem.normalized_query_hash = normalizedQueryHash(query_for_logging);
|
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
elem.client_info = context.getClientInfo();
|
|
|
|
|
|
|
|
bool log_queries = settings.log_queries && !internal;
|
|
|
|
|
|
|
|
/// Log into system table start of query execution, if need.
|
2020-08-14 21:27:05 +00:00
|
|
|
if (log_queries)
|
2018-03-10 19:57:13 +00:00
|
|
|
{
|
2020-12-18 06:54:38 +00:00
|
|
|
if (use_processors)
|
|
|
|
{
|
|
|
|
const auto & info = context.getQueryAccessInfo();
|
|
|
|
elem.query_databases = info.databases;
|
|
|
|
elem.query_tables = info.tables;
|
|
|
|
elem.query_columns = info.columns;
|
|
|
|
}
|
|
|
|
|
|
|
|
interpreter->extendQueryLogElem(elem, ast, context, query_database, query_table);
|
|
|
|
|
2018-05-17 16:01:41 +00:00
|
|
|
if (settings.log_query_settings)
|
|
|
|
elem.query_settings = std::make_shared<Settings>(context.getSettingsRef());
|
|
|
|
|
2020-12-28 02:38:16 +00:00
|
|
|
if (!settings.log_comment.toString().empty() && settings.log_comment.toString().length() <= max_query_size)
|
|
|
|
elem.log_comment = settings.log_comment.toString();
|
|
|
|
|
2020-10-29 19:28:46 +00:00
|
|
|
if (elem.type >= settings.log_queries_min_type && !settings.log_queries_min_query_duration_ms.totalMilliseconds())
|
2020-08-14 21:27:05 +00:00
|
|
|
{
|
|
|
|
if (auto query_log = context.getQueryLog())
|
|
|
|
query_log->add(elem);
|
|
|
|
}
|
2018-03-10 19:57:13 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-08-04 16:14:15 +00:00
|
|
|
/// Common code for finish and exception callbacks
|
Fix gcc10 build by reducing storage of the lambdas in executeQuery
There is no need to capture query AST for the status_info_to_query_log,
since callers already captured it anyway.
gcc10 reports:
../src/Interpreters/executeQuery.cpp: In member function ‘void std::__1::function<_Rp(_ArgTypes ...)>::swap(std::__1::function<_Rp(_ArgTypes ...)>&) [with _Rp = void; _ArgTypes = {DB::IBlockInputStream*, DB::IBlockOutputStream*, DB::QueryPipeline*}]’:
../src/Interpreters/executeQuery.cpp:490:49: error: array subscript 35 is outside array bounds of ‘std::__1::aligned_storage<32, 16>::type [1]’ [-Werror=array-bounds]
490 | auto status_info_to_query_log = [ast](QueryLogElement &element, const QueryStatusInfo &info) mutable
| ^
In file included from ../contrib/libcxx/include/algorithm:644,
from ../contrib/libcxx/include/__string:57,
from ../contrib/libcxx/include/string_view:175,
from ../contrib/libcxx/include/string:504,
from ../src/Common/formatReadable.h:3, from ../src/Interpreters/executeQuery.cpp:1:
../contrib/libcxx/include/functional:1877:60: note: while referencing ‘__tempbuf’
1877 | typename aligned_storage<sizeof(__buf_)>::type __tempbuf;
| ^~~~~~~~~
2020-08-19 18:17:33 +00:00
|
|
|
auto status_info_to_query_log = [](QueryLogElement &element, const QueryStatusInfo &info, const ASTPtr query_ast) mutable
|
2020-08-04 16:14:15 +00:00
|
|
|
{
|
|
|
|
DB::UInt64 query_time = info.elapsed_seconds * 1000000;
|
|
|
|
ProfileEvents::increment(ProfileEvents::QueryTimeMicroseconds, query_time);
|
Fix gcc10 build by reducing storage of the lambdas in executeQuery
There is no need to capture query AST for the status_info_to_query_log,
since callers already captured it anyway.
gcc10 reports:
../src/Interpreters/executeQuery.cpp: In member function ‘void std::__1::function<_Rp(_ArgTypes ...)>::swap(std::__1::function<_Rp(_ArgTypes ...)>&) [with _Rp = void; _ArgTypes = {DB::IBlockInputStream*, DB::IBlockOutputStream*, DB::QueryPipeline*}]’:
../src/Interpreters/executeQuery.cpp:490:49: error: array subscript 35 is outside array bounds of ‘std::__1::aligned_storage<32, 16>::type [1]’ [-Werror=array-bounds]
490 | auto status_info_to_query_log = [ast](QueryLogElement &element, const QueryStatusInfo &info) mutable
| ^
In file included from ../contrib/libcxx/include/algorithm:644,
from ../contrib/libcxx/include/__string:57,
from ../contrib/libcxx/include/string_view:175,
from ../contrib/libcxx/include/string:504,
from ../src/Common/formatReadable.h:3, from ../src/Interpreters/executeQuery.cpp:1:
../contrib/libcxx/include/functional:1877:60: note: while referencing ‘__tempbuf’
1877 | typename aligned_storage<sizeof(__buf_)>::type __tempbuf;
| ^~~~~~~~~
2020-08-19 18:17:33 +00:00
|
|
|
if (query_ast->as<ASTSelectQuery>() || query_ast->as<ASTSelectWithUnionQuery>())
|
2020-08-04 16:14:15 +00:00
|
|
|
{
|
|
|
|
ProfileEvents::increment(ProfileEvents::SelectQueryTimeMicroseconds, query_time);
|
|
|
|
}
|
Fix gcc10 build by reducing storage of the lambdas in executeQuery
There is no need to capture query AST for the status_info_to_query_log,
since callers already captured it anyway.
gcc10 reports:
../src/Interpreters/executeQuery.cpp: In member function ‘void std::__1::function<_Rp(_ArgTypes ...)>::swap(std::__1::function<_Rp(_ArgTypes ...)>&) [with _Rp = void; _ArgTypes = {DB::IBlockInputStream*, DB::IBlockOutputStream*, DB::QueryPipeline*}]’:
../src/Interpreters/executeQuery.cpp:490:49: error: array subscript 35 is outside array bounds of ‘std::__1::aligned_storage<32, 16>::type [1]’ [-Werror=array-bounds]
490 | auto status_info_to_query_log = [ast](QueryLogElement &element, const QueryStatusInfo &info) mutable
| ^
In file included from ../contrib/libcxx/include/algorithm:644,
from ../contrib/libcxx/include/__string:57,
from ../contrib/libcxx/include/string_view:175,
from ../contrib/libcxx/include/string:504,
from ../src/Common/formatReadable.h:3, from ../src/Interpreters/executeQuery.cpp:1:
../contrib/libcxx/include/functional:1877:60: note: while referencing ‘__tempbuf’
1877 | typename aligned_storage<sizeof(__buf_)>::type __tempbuf;
| ^~~~~~~~~
2020-08-19 18:17:33 +00:00
|
|
|
else if (query_ast->as<ASTInsertQuery>())
|
2020-08-04 16:14:15 +00:00
|
|
|
{
|
|
|
|
ProfileEvents::increment(ProfileEvents::InsertQueryTimeMicroseconds, query_time);
|
|
|
|
}
|
|
|
|
|
|
|
|
element.query_duration_ms = info.elapsed_seconds * 1000;
|
|
|
|
|
|
|
|
element.read_rows = info.read_rows;
|
|
|
|
element.read_bytes = info.read_bytes;
|
|
|
|
|
|
|
|
element.written_rows = info.written_rows;
|
|
|
|
element.written_bytes = info.written_bytes;
|
|
|
|
|
|
|
|
element.memory_usage = info.peak_memory_usage > 0 ? info.peak_memory_usage : 0;
|
|
|
|
|
|
|
|
element.thread_ids = std::move(info.thread_ids);
|
|
|
|
element.profile_counters = std::move(info.profile_counters);
|
|
|
|
};
|
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
/// Also make possible for caller to log successful query finish and exception during execution.
|
2020-10-29 19:28:46 +00:00
|
|
|
auto finish_callback = [elem, &context, ast,
|
|
|
|
log_queries,
|
|
|
|
log_queries_min_type = settings.log_queries_min_type,
|
|
|
|
log_queries_min_query_duration_ms = settings.log_queries_min_query_duration_ms.totalMilliseconds(),
|
|
|
|
status_info_to_query_log
|
|
|
|
]
|
2020-07-02 14:51:10 +00:00
|
|
|
(IBlockInputStream * stream_in, IBlockOutputStream * stream_out, QueryPipeline * query_pipeline) mutable
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2018-02-01 17:55:08 +00:00
|
|
|
QueryStatus * process_list_elem = context.getProcessListElement();
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
if (!process_list_elem)
|
|
|
|
return;
|
|
|
|
|
2018-06-13 19:01:07 +00:00
|
|
|
/// Update performance counters before logging to query_log
|
2018-06-19 20:30:35 +00:00
|
|
|
CurrentThread::finalizePerformanceCounters();
|
2018-06-13 19:01:07 +00:00
|
|
|
|
2018-08-27 18:16:32 +00:00
|
|
|
QueryStatusInfo info = process_list_elem->getInfo(true, context.getSettingsRef().log_profile_events);
|
2018-03-09 23:04:26 +00:00
|
|
|
|
|
|
|
double elapsed_seconds = info.elapsed_seconds;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-04-04 21:07:00 +00:00
|
|
|
elem.type = QueryLogElementType::QUERY_FINISH;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-09-15 06:49:02 +00:00
|
|
|
// construct event_time and event_time_microseconds using the same time point
|
|
|
|
// so that the two times will always be equal up to a precision of a second.
|
2020-09-30 17:36:02 +00:00
|
|
|
const auto finish_time = std::chrono::system_clock::now();
|
|
|
|
elem.event_time = time_in_seconds(finish_time);
|
2020-10-01 15:41:48 +00:00
|
|
|
elem.event_time_microseconds = time_in_microseconds(finish_time);
|
Fix gcc10 build by reducing storage of the lambdas in executeQuery
There is no need to capture query AST for the status_info_to_query_log,
since callers already captured it anyway.
gcc10 reports:
../src/Interpreters/executeQuery.cpp: In member function ‘void std::__1::function<_Rp(_ArgTypes ...)>::swap(std::__1::function<_Rp(_ArgTypes ...)>&) [with _Rp = void; _ArgTypes = {DB::IBlockInputStream*, DB::IBlockOutputStream*, DB::QueryPipeline*}]’:
../src/Interpreters/executeQuery.cpp:490:49: error: array subscript 35 is outside array bounds of ‘std::__1::aligned_storage<32, 16>::type [1]’ [-Werror=array-bounds]
490 | auto status_info_to_query_log = [ast](QueryLogElement &element, const QueryStatusInfo &info) mutable
| ^
In file included from ../contrib/libcxx/include/algorithm:644,
from ../contrib/libcxx/include/__string:57,
from ../contrib/libcxx/include/string_view:175,
from ../contrib/libcxx/include/string:504,
from ../src/Common/formatReadable.h:3, from ../src/Interpreters/executeQuery.cpp:1:
../contrib/libcxx/include/functional:1877:60: note: while referencing ‘__tempbuf’
1877 | typename aligned_storage<sizeof(__buf_)>::type __tempbuf;
| ^~~~~~~~~
2020-08-19 18:17:33 +00:00
|
|
|
status_info_to_query_log(elem, info, ast);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2019-04-25 11:25:49 +00:00
|
|
|
auto progress_callback = context.getProgressCallback();
|
2019-05-06 06:57:48 +00:00
|
|
|
|
2019-04-25 11:25:49 +00:00
|
|
|
if (progress_callback)
|
|
|
|
progress_callback(Progress(WriteProgress(info.written_rows, info.written_bytes)));
|
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
if (stream_in)
|
|
|
|
{
|
2019-01-23 14:48:50 +00:00
|
|
|
const BlockStreamProfileInfo & stream_in_info = stream_in->getProfileInfo();
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2019-01-23 14:48:50 +00:00
|
|
|
/// NOTE: INSERT SELECT query contains zero metrics
|
|
|
|
elem.result_rows = stream_in_info.rows;
|
|
|
|
elem.result_bytes = stream_in_info.bytes;
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
else if (stream_out) /// will be used only for ordinary INSERT queries
|
|
|
|
{
|
2020-04-22 06:01:33 +00:00
|
|
|
if (const auto * counting_stream = dynamic_cast<const CountingBlockOutputStream *>(stream_out))
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2019-01-22 19:56:53 +00:00
|
|
|
/// NOTE: Redundancy. The same values could be extracted from process_list_elem->progress_out.query_settings = process_list_elem->progress_in
|
2019-05-20 11:37:41 +00:00
|
|
|
elem.result_rows = counting_stream->getProgress().read_rows;
|
|
|
|
elem.result_bytes = counting_stream->getProgress().read_bytes;
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
}
|
2020-07-02 14:51:10 +00:00
|
|
|
else if (query_pipeline)
|
|
|
|
{
|
|
|
|
if (const auto * output_format = query_pipeline->getOutputFormat())
|
|
|
|
{
|
|
|
|
elem.result_rows = output_format->getResultRows();
|
|
|
|
elem.result_bytes = output_format->getResultBytes();
|
|
|
|
}
|
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
if (elem.read_rows != 0)
|
|
|
|
{
|
2020-05-30 21:57:37 +00:00
|
|
|
LOG_INFO(&Poco::Logger::get("executeQuery"), "Read {} rows, {} in {} sec., {} rows/sec., {}/sec.",
|
2020-05-30 21:35:52 +00:00
|
|
|
elem.read_rows, ReadableSize(elem.read_bytes), elapsed_seconds,
|
2020-05-23 21:41:35 +00:00
|
|
|
static_cast<size_t>(elem.read_rows / elapsed_seconds),
|
2020-05-30 21:35:52 +00:00
|
|
|
ReadableSize(elem.read_bytes / elapsed_seconds));
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
|
2020-02-02 02:27:15 +00:00
|
|
|
elem.thread_ids = std::move(info.thread_ids);
|
2018-05-17 16:01:41 +00:00
|
|
|
elem.profile_counters = std::move(info.profile_counters);
|
|
|
|
|
2020-10-29 19:28:46 +00:00
|
|
|
if (log_queries && elem.type >= log_queries_min_type && Int64(elem.query_duration_ms) >= log_queries_min_query_duration_ms)
|
2018-03-10 19:57:13 +00:00
|
|
|
{
|
|
|
|
if (auto query_log = context.getQueryLog())
|
|
|
|
query_log->add(elem);
|
|
|
|
}
|
2020-08-20 20:59:40 +00:00
|
|
|
|
2020-10-22 16:47:20 +00:00
|
|
|
if (auto opentelemetry_span_log = context.getOpenTelemetrySpanLog();
|
2020-11-18 17:43:18 +00:00
|
|
|
context.query_trace_context.trace_id
|
2020-10-22 16:47:20 +00:00
|
|
|
&& opentelemetry_span_log)
|
2020-08-20 20:59:40 +00:00
|
|
|
{
|
2020-08-27 18:44:20 +00:00
|
|
|
OpenTelemetrySpanLogElement span;
|
2020-11-18 17:43:18 +00:00
|
|
|
span.trace_id = context.query_trace_context.trace_id;
|
|
|
|
span.span_id = context.query_trace_context.span_id;
|
|
|
|
span.parent_span_id = context.getClientInfo().client_trace_context.span_id;
|
2020-08-27 18:44:20 +00:00
|
|
|
span.operation_name = "query";
|
2020-09-30 16:16:33 +00:00
|
|
|
span.start_time_us = elem.query_start_time_microseconds;
|
2020-09-30 17:36:02 +00:00
|
|
|
span.finish_time_us = time_in_microseconds(finish_time);
|
2020-08-27 18:44:20 +00:00
|
|
|
|
2020-11-12 23:27:18 +00:00
|
|
|
/// Keep values synchronized to type enum in QueryLogElement::createBlock.
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("clickhouse.query_status");
|
2020-08-27 18:44:20 +00:00
|
|
|
span.attribute_values.push_back("QueryFinish");
|
|
|
|
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("db.statement");
|
2020-08-27 18:44:20 +00:00
|
|
|
span.attribute_values.push_back(elem.query);
|
|
|
|
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("clickhouse.query_id");
|
2020-08-27 18:44:20 +00:00
|
|
|
span.attribute_values.push_back(elem.client_info.current_query_id);
|
2020-11-18 17:43:18 +00:00
|
|
|
if (!context.query_trace_context.tracestate.empty())
|
2020-08-28 01:21:08 +00:00
|
|
|
{
|
2020-09-08 13:19:27 +00:00
|
|
|
span.attribute_names.push_back("clickhouse.tracestate");
|
2020-08-28 01:21:08 +00:00
|
|
|
span.attribute_values.push_back(
|
2020-11-18 17:43:18 +00:00
|
|
|
context.query_trace_context.tracestate);
|
2020-08-28 01:21:08 +00:00
|
|
|
}
|
2020-08-27 18:44:20 +00:00
|
|
|
|
2020-10-22 16:47:20 +00:00
|
|
|
opentelemetry_span_log->add(span);
|
2020-08-20 20:59:40 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
};
|
|
|
|
|
2020-10-29 19:28:46 +00:00
|
|
|
auto exception_callback = [elem, &context, ast,
|
|
|
|
log_queries,
|
|
|
|
log_queries_min_type = settings.log_queries_min_type,
|
|
|
|
log_queries_min_query_duration_ms = settings.log_queries_min_query_duration_ms.totalMilliseconds(),
|
|
|
|
quota(quota), status_info_to_query_log] () mutable
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2020-03-07 17:37:38 +00:00
|
|
|
if (quota)
|
|
|
|
quota->used(Quota::ERRORS, 1, /* check_exceeded = */ false);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-04-04 21:07:00 +00:00
|
|
|
elem.type = QueryLogElementType::EXCEPTION_WHILE_PROCESSING;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-09-15 06:49:02 +00:00
|
|
|
// event_time and event_time_microseconds are being constructed from the same time point
|
2020-10-27 11:04:03 +00:00
|
|
|
// to ensure that both the times will be equal up to the precision of a second.
|
2020-09-15 06:49:02 +00:00
|
|
|
const auto time_now = std::chrono::system_clock::now();
|
2020-09-15 01:40:06 +00:00
|
|
|
|
2020-09-15 06:49:02 +00:00
|
|
|
elem.event_time = time_in_seconds(time_now);
|
|
|
|
elem.event_time_microseconds = time_in_microseconds(time_now);
|
2017-04-01 07:20:54 +00:00
|
|
|
elem.query_duration_ms = 1000 * (elem.event_time - elem.query_start_time);
|
2020-01-22 12:29:30 +00:00
|
|
|
elem.exception_code = getCurrentExceptionCode();
|
2017-04-01 07:20:54 +00:00
|
|
|
elem.exception = getCurrentExceptionMessage(false);
|
|
|
|
|
2018-02-01 17:55:08 +00:00
|
|
|
QueryStatus * process_list_elem = context.getProcessListElement();
|
2018-08-27 18:16:32 +00:00
|
|
|
const Settings & current_settings = context.getSettingsRef();
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2018-06-13 19:01:07 +00:00
|
|
|
/// Update performance counters before logging to query_log
|
2018-06-19 20:30:35 +00:00
|
|
|
CurrentThread::finalizePerformanceCounters();
|
2018-06-13 19:01:07 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
if (process_list_elem)
|
|
|
|
{
|
2018-08-27 18:16:32 +00:00
|
|
|
QueryStatusInfo info = process_list_elem->getInfo(true, current_settings.log_profile_events, false);
|
Fix gcc10 build by reducing storage of the lambdas in executeQuery
There is no need to capture query AST for the status_info_to_query_log,
since callers already captured it anyway.
gcc10 reports:
../src/Interpreters/executeQuery.cpp: In member function ‘void std::__1::function<_Rp(_ArgTypes ...)>::swap(std::__1::function<_Rp(_ArgTypes ...)>&) [with _Rp = void; _ArgTypes = {DB::IBlockInputStream*, DB::IBlockOutputStream*, DB::QueryPipeline*}]’:
../src/Interpreters/executeQuery.cpp:490:49: error: array subscript 35 is outside array bounds of ‘std::__1::aligned_storage<32, 16>::type [1]’ [-Werror=array-bounds]
490 | auto status_info_to_query_log = [ast](QueryLogElement &element, const QueryStatusInfo &info) mutable
| ^
In file included from ../contrib/libcxx/include/algorithm:644,
from ../contrib/libcxx/include/__string:57,
from ../contrib/libcxx/include/string_view:175,
from ../contrib/libcxx/include/string:504,
from ../src/Common/formatReadable.h:3, from ../src/Interpreters/executeQuery.cpp:1:
../contrib/libcxx/include/functional:1877:60: note: while referencing ‘__tempbuf’
1877 | typename aligned_storage<sizeof(__buf_)>::type __tempbuf;
| ^~~~~~~~~
2020-08-19 18:17:33 +00:00
|
|
|
status_info_to_query_log(elem, info, ast);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2018-08-27 18:16:32 +00:00
|
|
|
if (current_settings.calculate_text_stack_trace)
|
2018-08-23 01:31:28 +00:00
|
|
|
setExceptionStackTrace(elem);
|
2017-04-01 07:20:54 +00:00
|
|
|
logException(context, elem);
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2018-05-17 16:01:41 +00:00
|
|
|
/// In case of exception we log internal queries also
|
2020-10-29 19:28:46 +00:00
|
|
|
if (log_queries && elem.type >= log_queries_min_type && Int64(elem.query_duration_ms) >= log_queries_min_query_duration_ms)
|
2018-03-10 19:57:13 +00:00
|
|
|
{
|
|
|
|
if (auto query_log = context.getQueryLog())
|
|
|
|
query_log->add(elem);
|
|
|
|
}
|
2020-05-21 18:01:25 +00:00
|
|
|
|
|
|
|
ProfileEvents::increment(ProfileEvents::FailedQuery);
|
2020-05-22 23:37:14 +00:00
|
|
|
if (ast->as<ASTSelectQuery>() || ast->as<ASTSelectWithUnionQuery>())
|
|
|
|
{
|
2020-05-21 18:01:25 +00:00
|
|
|
ProfileEvents::increment(ProfileEvents::FailedSelectQuery);
|
|
|
|
}
|
2020-05-22 23:37:14 +00:00
|
|
|
else if (ast->as<ASTInsertQuery>())
|
|
|
|
{
|
|
|
|
ProfileEvents::increment(ProfileEvents::FailedInsertQuery);
|
|
|
|
}
|
2020-05-21 18:01:25 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
};
|
2015-07-01 05:18:54 +00:00
|
|
|
|
2019-04-05 10:52:07 +00:00
|
|
|
res.finish_callback = std::move(finish_callback);
|
|
|
|
res.exception_callback = std::move(exception_callback);
|
2019-03-26 18:28:37 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
if (!internal && res.in)
|
|
|
|
{
|
2020-11-10 18:22:26 +00:00
|
|
|
WriteBufferFromOwnString msg_buf;
|
|
|
|
res.in->dumpTree(msg_buf);
|
|
|
|
LOG_DEBUG(&Poco::Logger::get("executeQuery"), "Query pipeline:\n{}", msg_buf.str());
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
catch (...)
|
|
|
|
{
|
|
|
|
if (!internal)
|
2019-06-20 07:17:21 +00:00
|
|
|
{
|
|
|
|
if (query_for_logging.empty())
|
|
|
|
query_for_logging = prepareQueryForLogging(query, context);
|
|
|
|
|
2020-09-30 16:16:33 +00:00
|
|
|
onExceptionBeforeStart(query_for_logging, context, time_in_microseconds(current_time), ast);
|
2019-06-20 07:17:21 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
throw;
|
|
|
|
}
|
|
|
|
|
2020-02-27 15:40:11 +00:00
|
|
|
return std::make_tuple(ast, std::move(res));
|
2015-06-18 02:11:05 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// Executes the query given as a string and returns the resulting BlockIO.
/// The whole string [data, data + size) is handed to executeQueryImpl without an input buffer.
/// If the parsed query is a query with output and its format (explicit FORMAT clause, otherwise
/// the default format of the context) is "Null", the returned BlockIO gets 'null_format' set.
BlockIO executeQuery(
    const String & query,
    Context & context,
    bool internal,
    QueryProcessingStage::Enum stage,
    bool may_have_embedded_data)
{
    const char * query_begin = query.data();
    const char * query_end = query_begin + query.size();

    ASTPtr parsed_query;
    BlockIO result;
    std::tie(parsed_query, result) = executeQueryImpl(
        query_begin, query_end, context, internal, stage, !may_have_embedded_data, nullptr);

    /// Only queries with an output clause can carry a format.
    const auto * query_with_output = dynamic_cast<const ASTQueryWithOutput *>(parsed_query.get());
    if (!query_with_output)
        return result;

    String format_name = query_with_output->format
        ? getIdentifierName(query_with_output->format)
        : context.getDefaultFormat();

    if (format_name == "Null")
        result.null_format = true;

    return result;
}
|
|
|
|
|
2020-05-19 14:06:33 +00:00
|
|
|
/// Same as the five-argument executeQuery, with one extra step:
/// when 'allow_processors' is false and the result holds an initialized pipeline,
/// 'in' of the result is filled from getInputStream().
BlockIO executeQuery(
    const String & query,
    Context & context,
    bool internal,
    QueryProcessingStage::Enum stage,
    bool may_have_embedded_data,
    bool allow_processors)
{
    BlockIO io = executeQuery(query, context, internal, stage, may_have_embedded_data);

    /// Nothing to convert: either the caller accepts a pipeline, or there is no pipeline at all.
    if (allow_processors || !io.pipeline.initialized())
        return io;

    io.in = io.getInputStream();
    return io;
}
|
|
|
|
|
2015-06-18 00:27:25 +00:00
|
|
|
|
2011-10-30 11:30:52 +00:00
|
|
|
void executeQuery(
|
2017-04-01 07:20:54 +00:00
|
|
|
ReadBuffer & istr,
|
|
|
|
WriteBuffer & ostr,
|
|
|
|
bool allow_into_outfile,
|
|
|
|
Context & context,
|
2020-03-03 15:32:41 +00:00
|
|
|
std::function<void(const String &, const String &, const String &, const String &)> set_result_details)
|
2011-10-30 11:30:52 +00:00
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
PODArray<char> parse_buf;
|
|
|
|
const char * begin;
|
|
|
|
const char * end;
|
|
|
|
|
|
|
|
/// If 'istr' is empty now, fetch next data into buffer.
|
2020-07-31 14:53:41 +00:00
|
|
|
if (!istr.hasPendingData())
|
2017-04-01 07:20:54 +00:00
|
|
|
istr.next();
|
|
|
|
|
|
|
|
size_t max_query_size = context.getSettingsRef().max_query_size;
|
|
|
|
|
2019-02-20 09:22:13 +00:00
|
|
|
bool may_have_tail;
|
2018-03-26 19:41:55 +00:00
|
|
|
if (istr.buffer().end() - istr.position() > static_cast<ssize_t>(max_query_size))
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
|
|
|
/// If remaining buffer space in 'istr' is enough to parse query up to 'max_query_size' bytes, then parse inplace.
|
|
|
|
begin = istr.position();
|
|
|
|
end = istr.buffer().end();
|
|
|
|
istr.position() += end - begin;
|
2019-02-20 09:22:13 +00:00
|
|
|
/// Actually we don't know will query has additional data or not.
|
2020-12-04 02:15:44 +00:00
|
|
|
/// But we can't check istr.eof(), because begin and end pointers will become invalid
|
2019-02-20 09:22:13 +00:00
|
|
|
may_have_tail = true;
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
/// If not - copy enough data into 'parse_buf'.
|
2018-11-30 15:36:41 +00:00
|
|
|
WriteBufferFromVector<PODArray<char>> out(parse_buf);
|
|
|
|
LimitReadBuffer limit(istr, max_query_size + 1, false);
|
|
|
|
copyData(limit, out);
|
2020-01-10 21:42:26 +00:00
|
|
|
out.finalize();
|
2018-11-30 15:36:41 +00:00
|
|
|
|
2018-09-02 03:00:04 +00:00
|
|
|
begin = parse_buf.data();
|
2017-04-01 07:20:54 +00:00
|
|
|
end = begin + parse_buf.size();
|
2019-02-20 09:22:13 +00:00
|
|
|
/// Can check stream for eof, because we have copied data
|
|
|
|
may_have_tail = !istr.eof();
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
ASTPtr ast;
|
|
|
|
BlockIO streams;
|
|
|
|
|
2020-05-18 13:55:07 +00:00
|
|
|
std::tie(ast, streams) = executeQueryImpl(begin, end, context, false, QueryProcessingStage::Complete, may_have_tail, &istr);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2019-03-26 18:28:37 +00:00
|
|
|
auto & pipeline = streams.pipeline;
|
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
try
|
|
|
|
{
|
|
|
|
if (streams.out)
|
|
|
|
{
|
2019-05-30 20:12:44 +00:00
|
|
|
InputStreamFromASTInsertQuery in(ast, &istr, streams.out->getHeader(), context, nullptr);
|
2017-04-01 07:20:54 +00:00
|
|
|
copyData(in, *streams.out);
|
|
|
|
}
|
2020-10-10 01:43:07 +00:00
|
|
|
else if (streams.in)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2019-03-12 12:41:57 +00:00
|
|
|
const auto * ast_query_with_output = dynamic_cast<const ASTQueryWithOutput *>(ast.get());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
WriteBuffer * out_buf = &ostr;
|
2017-11-20 04:15:43 +00:00
|
|
|
std::optional<WriteBufferFromFile> out_file_buf;
|
2017-04-01 07:20:54 +00:00
|
|
|
if (ast_query_with_output && ast_query_with_output->out_file)
|
|
|
|
{
|
|
|
|
if (!allow_into_outfile)
|
|
|
|
throw Exception("INTO OUTFILE is not allowed", ErrorCodes::INTO_OUTFILE_NOT_ALLOWED);
|
|
|
|
|
2019-03-15 16:14:13 +00:00
|
|
|
const auto & out_file = ast_query_with_output->out_file->as<ASTLiteral &>().value.safeGet<std::string>();
|
2017-04-01 07:20:54 +00:00
|
|
|
out_file_buf.emplace(out_file, DBMS_DEFAULT_BUFFER_SIZE, O_WRONLY | O_EXCL | O_CREAT);
|
2017-10-04 00:22:00 +00:00
|
|
|
out_buf = &*out_file_buf;
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
String format_name = ast_query_with_output && (ast_query_with_output->format != nullptr)
|
2019-08-08 20:02:30 +00:00
|
|
|
? getIdentifierName(ast_query_with_output->format)
|
2017-04-01 07:20:54 +00:00
|
|
|
: context.getDefaultFormat();
|
|
|
|
|
2018-01-07 00:35:44 +00:00
|
|
|
BlockOutputStreamPtr out = context.getOutputFormat(format_name, *out_buf, streams.in->getHeader());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2019-01-23 14:48:50 +00:00
|
|
|
/// Save previous progress callback if any. TODO Do it more conveniently.
|
|
|
|
auto previous_progress_callback = context.getProgressCallback();
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2019-01-23 14:48:50 +00:00
|
|
|
/// NOTE Progress callback takes shared ownership of 'out'.
|
|
|
|
streams.in->setProgressCallback([out, previous_progress_callback] (const Progress & progress)
|
|
|
|
{
|
|
|
|
if (previous_progress_callback)
|
|
|
|
previous_progress_callback(progress);
|
|
|
|
out->onProgress(progress);
|
|
|
|
});
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-03-03 15:32:41 +00:00
|
|
|
if (set_result_details)
|
|
|
|
set_result_details(context.getClientInfo().current_query_id, out->getContentType(), format_name, DateLUT::instance().getTimeZone());
|
2019-02-02 12:24:26 +00:00
|
|
|
|
2020-02-02 01:09:49 +00:00
|
|
|
copyData(*streams.in, *out, [](){ return false; }, [&out](const Block &) { out->flush(); });
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
2020-10-10 01:43:07 +00:00
|
|
|
else if (pipeline.initialized())
|
2019-03-26 18:28:37 +00:00
|
|
|
{
|
|
|
|
const ASTQueryWithOutput * ast_query_with_output = dynamic_cast<const ASTQueryWithOutput *>(ast.get());
|
|
|
|
|
|
|
|
WriteBuffer * out_buf = &ostr;
|
|
|
|
std::optional<WriteBufferFromFile> out_file_buf;
|
|
|
|
if (ast_query_with_output && ast_query_with_output->out_file)
|
|
|
|
{
|
|
|
|
if (!allow_into_outfile)
|
|
|
|
throw Exception("INTO OUTFILE is not allowed", ErrorCodes::INTO_OUTFILE_NOT_ALLOWED);
|
|
|
|
|
|
|
|
const auto & out_file = typeid_cast<const ASTLiteral &>(*ast_query_with_output->out_file).value.safeGet<std::string>();
|
|
|
|
out_file_buf.emplace(out_file, DBMS_DEFAULT_BUFFER_SIZE, O_WRONLY | O_EXCL | O_CREAT);
|
|
|
|
out_buf = &*out_file_buf;
|
|
|
|
}
|
|
|
|
|
|
|
|
String format_name = ast_query_with_output && (ast_query_with_output->format != nullptr)
|
2019-08-08 20:02:30 +00:00
|
|
|
? getIdentifierName(ast_query_with_output->format)
|
2019-03-26 18:28:37 +00:00
|
|
|
: context.getDefaultFormat();
|
|
|
|
|
2020-05-27 18:20:26 +00:00
|
|
|
if (!pipeline.isCompleted())
|
2019-04-12 15:32:53 +00:00
|
|
|
{
|
2020-05-27 18:20:26 +00:00
|
|
|
pipeline.addSimpleTransform([](const Block & header)
|
|
|
|
{
|
|
|
|
return std::make_shared<MaterializingTransform>(header);
|
|
|
|
});
|
2019-04-12 15:32:53 +00:00
|
|
|
|
2020-05-27 18:20:26 +00:00
|
|
|
auto out = context.getOutputFormatProcessor(format_name, *out_buf, pipeline.getHeader());
|
|
|
|
out->setAutoFlush();
|
2019-03-26 18:28:37 +00:00
|
|
|
|
2020-05-27 18:20:26 +00:00
|
|
|
/// Save previous progress callback if any. TODO Do it more conveniently.
|
|
|
|
auto previous_progress_callback = context.getProgressCallback();
|
2019-03-26 18:28:37 +00:00
|
|
|
|
2020-05-27 18:20:26 +00:00
|
|
|
/// NOTE Progress callback takes shared ownership of 'out'.
|
|
|
|
pipeline.setProgressCallback([out, previous_progress_callback] (const Progress & progress)
|
|
|
|
{
|
|
|
|
if (previous_progress_callback)
|
|
|
|
previous_progress_callback(progress);
|
|
|
|
out->onProgress(progress);
|
|
|
|
});
|
2019-03-26 18:28:37 +00:00
|
|
|
|
2020-05-27 18:20:26 +00:00
|
|
|
if (set_result_details)
|
|
|
|
set_result_details(context.getClientInfo().current_query_id, out->getContentType(), format_name, DateLUT::instance().getTimeZone());
|
2019-03-26 18:28:37 +00:00
|
|
|
|
2020-05-27 18:20:26 +00:00
|
|
|
pipeline.setOutputFormat(std::move(out));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
pipeline.setProgressCallback(context.getProgressCallback());
|
|
|
|
}
|
2019-04-12 13:56:48 +00:00
|
|
|
|
2019-04-29 13:57:29 +00:00
|
|
|
{
|
2019-05-16 14:57:27 +00:00
|
|
|
auto executor = pipeline.execute();
|
2020-03-15 21:22:55 +00:00
|
|
|
executor->execute(pipeline.getNumThreads());
|
2019-04-29 13:57:29 +00:00
|
|
|
}
|
2019-03-26 18:28:37 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
catch (...)
|
|
|
|
{
|
|
|
|
streams.onException();
|
|
|
|
throw;
|
|
|
|
}
|
|
|
|
|
|
|
|
streams.onFinish();
|
2015-06-18 02:11:05 +00:00
|
|
|
}
|
2012-03-11 08:52:56 +00:00
|
|
|
|
2011-10-30 11:30:52 +00:00
|
|
|
}
|