mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-16 03:12:43 +00:00
ccde92f855
After #40732 it became possible that getrusage() (from detachQuery(), from buildPushingToViewsChain()) will be called for incorrect thread, and so when the difference will be calculated it will be simply garbage. But actually the root of this problem is #25714, after which it became possible to have multiple ThreadStatus for one thread, and this is very tricky (sigh). Here are some other thoughts about it: - Make ThreadStatus nested - decided that complexity does not worth it, at least only for this case - Move some members into ThreadGroupStatus - will break per-thread statistics (and hence query_thread_log, BTW does somebody uses it?) - Move some members into a separate structure But decided to fix the issue w/o any refactoring, to make easy for backport. Signed-off-by: Azat Khuzhin <a.khuzhin@semrush.com>
577 lines
18 KiB
C++
577 lines
18 KiB
C++
#include <mutex>
|
|
#include <Common/ThreadStatus.h>
|
|
|
|
#include <Processors/Transforms/buildPushingToViewsChain.h>
|
|
#include <Interpreters/Context.h>
|
|
#include <Interpreters/OpenTelemetrySpanLog.h>
|
|
#include <Interpreters/ProcessList.h>
|
|
#include <Interpreters/QueryThreadLog.h>
|
|
#include <Interpreters/QueryViewsLog.h>
|
|
#include <Interpreters/TraceCollector.h>
|
|
#include <Parsers/formatAST.h>
|
|
#include <Common/CurrentThread.h>
|
|
#include <Common/Exception.h>
|
|
#include <Common/ProfileEvents.h>
|
|
#include <Common/QueryProfiler.h>
|
|
#include <Common/SensitiveDataMasker.h>
|
|
#include <Common/ThreadProfileEvents.h>
|
|
#include <Common/setThreadName.h>
|
|
#include <Common/noexcept_scope.h>
|
|
#include <Common/DateLUT.h>
|
|
#include <base/errnoToString.h>
|
|
|
|
#if defined(OS_LINUX)
|
|
# include <Common/hasLinuxCapability.h>
|
|
|
|
# include <sys/time.h>
|
|
# include <sys/resource.h>
|
|
#endif
|
|
|
|
|
|
/// Implement some methods of ThreadStatus and CurrentThread here to avoid extra linking dependencies in clickhouse_common_io
|
|
/// TODO It doesn't make sense.
|
|
|
|
namespace DB
|
|
{
|
|
|
|
namespace ErrorCodes
|
|
{
|
|
extern const int LOGICAL_ERROR;
|
|
extern const int CANNOT_SET_THREAD_PRIORITY;
|
|
}
|
|
|
|
void ThreadStatus::applyQuerySettings()
|
|
{
|
|
auto query_context_ptr = query_context.lock();
|
|
assert(query_context_ptr);
|
|
const Settings & settings = query_context_ptr->getSettingsRef();
|
|
|
|
query_id = query_context_ptr->getCurrentQueryId();
|
|
initQueryProfiler();
|
|
|
|
untracked_memory_limit = settings.max_untracked_memory;
|
|
if (settings.memory_profiler_step && settings.memory_profiler_step < static_cast<UInt64>(untracked_memory_limit))
|
|
untracked_memory_limit = settings.memory_profiler_step;
|
|
|
|
#if defined(OS_LINUX)
|
|
/// Set "nice" value if required.
|
|
Int32 new_os_thread_priority = static_cast<Int32>(settings.os_thread_priority);
|
|
if (new_os_thread_priority && hasLinuxCapability(CAP_SYS_NICE))
|
|
{
|
|
LOG_TRACE(log, "Setting nice to {}", new_os_thread_priority);
|
|
|
|
if (0 != setpriority(PRIO_PROCESS, static_cast<unsigned>(thread_id), new_os_thread_priority))
|
|
throwFromErrno("Cannot 'setpriority'", ErrorCodes::CANNOT_SET_THREAD_PRIORITY);
|
|
|
|
os_thread_priority = new_os_thread_priority;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
void ThreadStatus::attachQueryContext(ContextPtr query_context_)
|
|
{
|
|
query_context = query_context_;
|
|
|
|
if (global_context.expired())
|
|
global_context = query_context_->getGlobalContext();
|
|
|
|
if (thread_group)
|
|
{
|
|
std::lock_guard lock(thread_group->mutex);
|
|
|
|
thread_group->query_context = query_context;
|
|
if (thread_group->global_context.expired())
|
|
thread_group->global_context = global_context;
|
|
}
|
|
|
|
applyQuerySettings();
|
|
}
|
|
|
|
void CurrentThread::defaultThreadDeleter()
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->detachQuery(true, true);
|
|
}
|
|
|
|
void ThreadStatus::setupState(const ThreadGroupStatusPtr & thread_group_)
|
|
{
|
|
assertState({ThreadState::DetachedFromQuery}, __PRETTY_FUNCTION__);
|
|
|
|
/// Attach or init current thread to thread group and copy useful information from it
|
|
thread_group = thread_group_;
|
|
|
|
performance_counters.setParent(&thread_group->performance_counters);
|
|
memory_tracker.setParent(&thread_group->memory_tracker);
|
|
|
|
{
|
|
std::lock_guard lock(thread_group->mutex);
|
|
|
|
/// NOTE: thread may be attached multiple times if it is reused from a thread pool.
|
|
thread_group->thread_ids.insert(thread_id);
|
|
thread_group->threads.insert(this);
|
|
|
|
logs_queue_ptr = thread_group->logs_queue_ptr;
|
|
fatal_error_callback = thread_group->fatal_error_callback;
|
|
query_context = thread_group->query_context;
|
|
profile_queue_ptr = thread_group->profile_queue_ptr;
|
|
|
|
if (global_context.expired())
|
|
global_context = thread_group->global_context;
|
|
}
|
|
|
|
if (auto query_context_ptr = query_context.lock())
|
|
{
|
|
applyQuerySettings();
|
|
}
|
|
|
|
initPerformanceCounters();
|
|
|
|
thread_state = ThreadState::AttachedToQuery;
|
|
}
|
|
|
|
void ThreadStatus::setInternalThread()
|
|
{
|
|
chassert(!query_profiler_real && !query_profiler_cpu);
|
|
internal_thread = true;
|
|
}
|
|
|
|
void ThreadStatus::initializeQuery()
|
|
{
|
|
setupState(std::make_shared<ThreadGroupStatus>());
|
|
|
|
/// No need to lock on mutex here
|
|
thread_group->memory_tracker.setDescription("(for query)");
|
|
thread_group->master_thread_id = thread_id;
|
|
}
|
|
|
|
void ThreadStatus::attachQuery(const ThreadGroupStatusPtr & thread_group_, bool check_detached)
|
|
{
|
|
if (thread_state == ThreadState::AttachedToQuery)
|
|
{
|
|
if (check_detached)
|
|
throw Exception("Can't attach query to the thread, it is already attached", ErrorCodes::LOGICAL_ERROR);
|
|
return;
|
|
}
|
|
|
|
if (!thread_group_)
|
|
throw Exception("Attempt to attach to nullptr thread group", ErrorCodes::LOGICAL_ERROR);
|
|
|
|
setupState(thread_group_);
|
|
}
|
|
|
|
void ThreadStatus::initPerformanceCounters()
|
|
{
|
|
performance_counters_finalized = false;
|
|
|
|
/// Clear stats from previous query if a new query is started
|
|
/// TODO: make separate query_thread_performance_counters and thread_performance_counters
|
|
performance_counters.resetCounters();
|
|
memory_tracker.resetCounters();
|
|
memory_tracker.setDescription("(for thread)");
|
|
|
|
// query_start_time_{microseconds, nanoseconds} are all constructed from the same time point
|
|
// to ensure that they are all equal up to the precision of a second.
|
|
const auto now = std::chrono::system_clock::now();
|
|
|
|
query_start_time_nanoseconds = timeInNanoseconds(now);
|
|
query_start_time = timeInSeconds(now);
|
|
query_start_time_microseconds = timeInMicroseconds(now);
|
|
++queries_started;
|
|
|
|
// query_start_time_nanoseconds cannot be used here since RUsageCounters expect CLOCK_MONOTONIC
|
|
*last_rusage = RUsageCounters::current();
|
|
|
|
if (!internal_thread)
|
|
{
|
|
if (auto query_context_ptr = query_context.lock())
|
|
{
|
|
const Settings & settings = query_context_ptr->getSettingsRef();
|
|
if (settings.metrics_perf_events_enabled)
|
|
{
|
|
try
|
|
{
|
|
current_thread_counters.initializeProfileEvents(
|
|
settings.metrics_perf_events_list);
|
|
}
|
|
catch (...)
|
|
{
|
|
tryLogCurrentException(__PRETTY_FUNCTION__);
|
|
}
|
|
}
|
|
}
|
|
|
|
if (!taskstats)
|
|
{
|
|
try
|
|
{
|
|
taskstats = TasksStatsCounters::create(thread_id);
|
|
}
|
|
catch (...)
|
|
{
|
|
tryLogCurrentException(log);
|
|
}
|
|
}
|
|
if (taskstats)
|
|
taskstats->reset();
|
|
}
|
|
}
|
|
|
|
void ThreadStatus::finalizePerformanceCounters()
|
|
{
|
|
if (performance_counters_finalized || internal_thread)
|
|
return;
|
|
|
|
performance_counters_finalized = true;
|
|
updatePerformanceCounters();
|
|
|
|
// We want to close perf file descriptors if the perf events were enabled for
|
|
// one query. What this code does in practice is less clear -- e.g., if I run
|
|
// 'select 1 settings metrics_perf_events_enabled = 1', I still get
|
|
// query_context->getSettingsRef().metrics_perf_events_enabled == 0 *shrug*.
|
|
bool close_perf_descriptors = true;
|
|
if (auto query_context_ptr = query_context.lock())
|
|
close_perf_descriptors = !query_context_ptr->getSettingsRef().metrics_perf_events_enabled;
|
|
|
|
try
|
|
{
|
|
current_thread_counters.finalizeProfileEvents(performance_counters);
|
|
if (close_perf_descriptors)
|
|
current_thread_counters.closeEventDescriptors();
|
|
}
|
|
catch (...)
|
|
{
|
|
tryLogCurrentException(log);
|
|
}
|
|
|
|
try
|
|
{
|
|
auto global_context_ptr = global_context.lock();
|
|
auto query_context_ptr = query_context.lock();
|
|
if (global_context_ptr && query_context_ptr)
|
|
{
|
|
const auto & settings = query_context_ptr->getSettingsRef();
|
|
if (settings.log_queries && settings.log_query_threads)
|
|
{
|
|
const auto now = std::chrono::system_clock::now();
|
|
Int64 query_duration_ms = (timeInMicroseconds(now) - query_start_time_microseconds) / 1000;
|
|
if (query_duration_ms >= settings.log_queries_min_query_duration_ms.totalMilliseconds())
|
|
{
|
|
if (auto thread_log = global_context_ptr->getQueryThreadLog())
|
|
logToQueryThreadLog(*thread_log, query_context_ptr->getCurrentDatabase(), now);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
catch (...)
|
|
{
|
|
tryLogCurrentException(log);
|
|
}
|
|
}
|
|
|
|
void ThreadStatus::resetPerformanceCountersLastUsage()
|
|
{
|
|
*last_rusage = RUsageCounters::current();
|
|
if (taskstats)
|
|
taskstats->reset();
|
|
}
|
|
|
|
void ThreadStatus::initQueryProfiler()
|
|
{
|
|
if (internal_thread)
|
|
return;
|
|
|
|
/// query profilers are useless without trace collector
|
|
auto global_context_ptr = global_context.lock();
|
|
if (!global_context_ptr || !global_context_ptr->hasTraceCollector())
|
|
return;
|
|
|
|
auto query_context_ptr = query_context.lock();
|
|
assert(query_context_ptr);
|
|
const auto & settings = query_context_ptr->getSettingsRef();
|
|
|
|
try
|
|
{
|
|
if (settings.query_profiler_real_time_period_ns > 0)
|
|
query_profiler_real = std::make_unique<QueryProfilerReal>(thread_id,
|
|
/* period= */ static_cast<UInt32>(settings.query_profiler_real_time_period_ns));
|
|
|
|
if (settings.query_profiler_cpu_time_period_ns > 0)
|
|
query_profiler_cpu = std::make_unique<QueryProfilerCPU>(thread_id,
|
|
/* period= */ static_cast<UInt32>(settings.query_profiler_cpu_time_period_ns));
|
|
}
|
|
catch (...)
|
|
{
|
|
/// QueryProfiler is optional.
|
|
tryLogCurrentException("ThreadStatus", "Cannot initialize QueryProfiler");
|
|
}
|
|
}
|
|
|
|
void ThreadStatus::finalizeQueryProfiler()
|
|
{
|
|
query_profiler_real.reset();
|
|
query_profiler_cpu.reset();
|
|
}
|
|
|
|
void ThreadStatus::detachQuery(bool exit_if_already_detached, bool thread_exits)
|
|
{
|
|
LockMemoryExceptionInThread lock_memory_tracker(VariableContext::Global);
|
|
|
|
if (exit_if_already_detached && thread_state == ThreadState::DetachedFromQuery)
|
|
{
|
|
thread_state = thread_exits ? ThreadState::Died : ThreadState::DetachedFromQuery;
|
|
return;
|
|
}
|
|
|
|
assertState({ThreadState::AttachedToQuery}, __PRETTY_FUNCTION__);
|
|
|
|
finalizeQueryProfiler();
|
|
finalizePerformanceCounters();
|
|
|
|
/// Detach from thread group
|
|
{
|
|
std::lock_guard guard(thread_group->mutex);
|
|
thread_group->threads.erase(this);
|
|
}
|
|
performance_counters.setParent(&ProfileEvents::global_counters);
|
|
memory_tracker.reset();
|
|
|
|
memory_tracker.setParent(thread_group->memory_tracker.getParent());
|
|
|
|
query_id.clear();
|
|
query_context.reset();
|
|
|
|
/// Avoid leaking of ThreadGroupStatus::finished_threads_counters_memory
|
|
/// (this is in case someone uses system thread but did not call getProfileEventsCountersAndMemoryForThreads())
|
|
{
|
|
std::lock_guard guard(thread_group->mutex);
|
|
auto stats = std::move(thread_group->finished_threads_counters_memory);
|
|
}
|
|
|
|
thread_group.reset();
|
|
|
|
thread_state = thread_exits ? ThreadState::Died : ThreadState::DetachedFromQuery;
|
|
|
|
#if defined(OS_LINUX)
|
|
if (os_thread_priority)
|
|
{
|
|
LOG_TRACE(log, "Resetting nice");
|
|
|
|
if (0 != setpriority(PRIO_PROCESS, static_cast<int>(thread_id), 0))
|
|
LOG_ERROR(log, "Cannot 'setpriority' back to zero: {}", errnoToString());
|
|
|
|
os_thread_priority = 0;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
void ThreadStatus::logToQueryThreadLog(QueryThreadLog & thread_log, const String & current_database, std::chrono::time_point<std::chrono::system_clock> now)
|
|
{
|
|
QueryThreadLogElement elem;
|
|
|
|
// construct current_time and current_time_microseconds using the same time point
|
|
// so that the two times will always be equal up to a precision of a second.
|
|
auto current_time = timeInSeconds(now);
|
|
auto current_time_microseconds = timeInMicroseconds(now);
|
|
|
|
elem.event_time = current_time;
|
|
elem.event_time_microseconds = current_time_microseconds;
|
|
elem.query_start_time = query_start_time;
|
|
elem.query_start_time_microseconds = query_start_time_microseconds;
|
|
elem.query_duration_ms = (timeInNanoseconds(now) - query_start_time_nanoseconds) / 1000000U;
|
|
|
|
elem.read_rows = progress_in.read_rows.load(std::memory_order_relaxed);
|
|
elem.read_bytes = progress_in.read_bytes.load(std::memory_order_relaxed);
|
|
|
|
elem.written_rows = progress_out.written_rows.load(std::memory_order_relaxed);
|
|
elem.written_bytes = progress_out.written_bytes.load(std::memory_order_relaxed);
|
|
elem.memory_usage = memory_tracker.get();
|
|
elem.peak_memory_usage = memory_tracker.getPeak();
|
|
|
|
elem.thread_name = getThreadName();
|
|
elem.thread_id = thread_id;
|
|
|
|
elem.current_database = current_database;
|
|
if (thread_group)
|
|
{
|
|
{
|
|
std::lock_guard lock(thread_group->mutex);
|
|
|
|
elem.master_thread_id = thread_group->master_thread_id;
|
|
elem.query = thread_group->query;
|
|
elem.normalized_query_hash = thread_group->normalized_query_hash;
|
|
}
|
|
}
|
|
|
|
auto query_context_ptr = query_context.lock();
|
|
if (query_context_ptr)
|
|
{
|
|
elem.client_info = query_context_ptr->getClientInfo();
|
|
|
|
if (query_context_ptr->getSettingsRef().log_profile_events != 0)
|
|
{
|
|
/// NOTE: Here we are in the same thread, so we can make memcpy()
|
|
elem.profile_counters = std::make_shared<ProfileEvents::Counters::Snapshot>(performance_counters.getPartiallyAtomicSnapshot());
|
|
}
|
|
}
|
|
|
|
thread_log.add(elem);
|
|
}
|
|
|
|
static String getCleanQueryAst(const ASTPtr q, ContextPtr context)
|
|
{
|
|
String res = serializeAST(*q, true);
|
|
if (auto * masker = SensitiveDataMasker::getInstance())
|
|
masker->wipeSensitiveData(res);
|
|
|
|
res = res.substr(0, context->getSettingsRef().log_queries_cut_to_length);
|
|
|
|
return res;
|
|
}
|
|
|
|
void ThreadStatus::logToQueryViewsLog(const ViewRuntimeData & vinfo)
|
|
{
|
|
auto query_context_ptr = query_context.lock();
|
|
if (!query_context_ptr)
|
|
return;
|
|
auto views_log = query_context_ptr->getQueryViewsLog();
|
|
if (!views_log)
|
|
return;
|
|
|
|
QueryViewsLogElement element;
|
|
|
|
element.event_time = timeInSeconds(vinfo.runtime_stats->event_time);
|
|
element.event_time_microseconds = timeInMicroseconds(vinfo.runtime_stats->event_time);
|
|
element.view_duration_ms = vinfo.runtime_stats->elapsed_ms;
|
|
|
|
element.initial_query_id = query_id;
|
|
element.view_name = vinfo.table_id.getFullTableName();
|
|
element.view_uuid = vinfo.table_id.uuid;
|
|
element.view_type = vinfo.runtime_stats->type;
|
|
if (vinfo.query)
|
|
element.view_query = getCleanQueryAst(vinfo.query, query_context_ptr);
|
|
element.view_target = vinfo.runtime_stats->target_name;
|
|
|
|
auto events = std::make_shared<ProfileEvents::Counters::Snapshot>(performance_counters.getPartiallyAtomicSnapshot());
|
|
element.read_rows = progress_in.read_rows.load(std::memory_order_relaxed);
|
|
element.read_bytes = progress_in.read_bytes.load(std::memory_order_relaxed);
|
|
element.written_rows = progress_out.written_rows.load(std::memory_order_relaxed);
|
|
element.written_bytes = progress_out.written_bytes.load(std::memory_order_relaxed);
|
|
element.peak_memory_usage = memory_tracker.getPeak() > 0 ? memory_tracker.getPeak() : 0;
|
|
if (query_context_ptr->getSettingsRef().log_profile_events != 0)
|
|
{
|
|
element.profile_counters = events;
|
|
}
|
|
|
|
element.status = vinfo.runtime_stats->event_status;
|
|
element.exception_code = 0;
|
|
if (vinfo.exception)
|
|
{
|
|
element.exception_code = getExceptionErrorCode(vinfo.exception);
|
|
element.exception = getExceptionMessage(vinfo.exception, false);
|
|
if (query_context_ptr->getSettingsRef().calculate_text_stack_trace)
|
|
element.stack_trace = getExceptionStackTraceString(vinfo.exception);
|
|
}
|
|
|
|
views_log->add(element);
|
|
}
|
|
|
|
void CurrentThread::initializeQuery()
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->initializeQuery();
|
|
current_thread->deleter = CurrentThread::defaultThreadDeleter;
|
|
}
|
|
|
|
void CurrentThread::attachTo(const ThreadGroupStatusPtr & thread_group)
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->attachQuery(thread_group, true);
|
|
current_thread->deleter = CurrentThread::defaultThreadDeleter;
|
|
}
|
|
|
|
void CurrentThread::attachToIfDetached(const ThreadGroupStatusPtr & thread_group)
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->attachQuery(thread_group, false);
|
|
current_thread->deleter = CurrentThread::defaultThreadDeleter;
|
|
}
|
|
|
|
void CurrentThread::attachQueryContext(ContextPtr query_context)
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->attachQueryContext(query_context);
|
|
}
|
|
|
|
void CurrentThread::finalizePerformanceCounters()
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->finalizePerformanceCounters();
|
|
}
|
|
|
|
void CurrentThread::detachQuery()
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->detachQuery(false);
|
|
}
|
|
|
|
void CurrentThread::detachQueryIfNotDetached()
|
|
{
|
|
if (unlikely(!current_thread))
|
|
return;
|
|
current_thread->detachQuery(true);
|
|
}
|
|
|
|
|
|
CurrentThread::QueryScope::QueryScope(ContextMutablePtr query_context)
|
|
{
|
|
CurrentThread::initializeQuery();
|
|
CurrentThread::attachQueryContext(query_context);
|
|
if (!query_context->hasQueryContext())
|
|
query_context->makeQueryContext();
|
|
}
|
|
|
|
CurrentThread::QueryScope::QueryScope(ContextPtr query_context)
|
|
{
|
|
if (!query_context->hasQueryContext())
|
|
throw Exception(
|
|
ErrorCodes::LOGICAL_ERROR, "Cannot initialize query scope without query context");
|
|
|
|
CurrentThread::initializeQuery();
|
|
CurrentThread::attachQueryContext(query_context);
|
|
}
|
|
|
|
void CurrentThread::QueryScope::logPeakMemoryUsage()
|
|
{
|
|
auto group = CurrentThread::getGroup();
|
|
if (!group)
|
|
return;
|
|
|
|
log_peak_memory_usage_in_destructor = false;
|
|
group->memory_tracker.logPeakMemoryUsage();
|
|
}
|
|
|
|
CurrentThread::QueryScope::~QueryScope()
|
|
{
|
|
try
|
|
{
|
|
if (log_peak_memory_usage_in_destructor)
|
|
logPeakMemoryUsage();
|
|
|
|
CurrentThread::detachQueryIfNotDetached();
|
|
}
|
|
catch (...)
|
|
{
|
|
tryLogCurrentException("CurrentThread", __PRETTY_FUNCTION__);
|
|
}
|
|
}
|
|
|
|
}
|