#pragma once #include #include #include #include #include #include #if defined(__linux__) #include #else struct taskstats {}; #endif /** Implement ProfileEvents with statistics about resource consumption of the current thread. */ namespace ProfileEvents { extern const Event RealTimeMicroseconds; extern const Event UserTimeMicroseconds; extern const Event SystemTimeMicroseconds; extern const Event SoftPageFaults; extern const Event HardPageFaults; extern const Event VoluntaryContextSwitches; extern const Event InvoluntaryContextSwitches; #if defined(__linux__) extern const Event OSIOWaitMicroseconds; extern const Event OSCPUWaitMicroseconds; extern const Event OSCPUVirtualTimeMicroseconds; extern const Event OSReadChars; extern const Event OSWriteChars; extern const Event OSReadBytes; extern const Event OSWriteBytes; extern const Event PerfCpuCycles; extern const Event PerfInstructions; extern const Event PerfCacheReferences; extern const Event PerfCacheMisses; extern const Event PerfBranchInstructions; extern const Event PerfBranchMisses; extern const Event PerfBusCycles; extern const Event PerfStalledCyclesFrontend; extern const Event PerfStalledCyclesBackend; extern const Event PerfRefCpuCycles; extern const Event PerfCpuClock; extern const Event PerfTaskClock; extern const Event PerfContextSwitches; extern const Event PerfCpuMigrations; extern const Event PerfAlignmentFaults; extern const Event PerfEmulationFaults; extern const Event PerfMinEnabledTime; extern const Event PerfMinEnabledRunningTime; extern const Event PerfDataTLBReferences; extern const Event PerfDataTLBMisses; extern const Event PerfInstructionTLBReferences; extern const Event PerfInstructionTLBMisses; extern const Event PerfLocalMemoryReferences; extern const Event PerfLocalMemoryMisses; #endif } namespace DB { /// Handles overflow template inline TUInt safeDiff(TUInt prev, TUInt curr) { return curr >= prev ? curr - prev : 0; } inline UInt64 getCurrentTimeNanoseconds(clockid_t clock_type = CLOCK_MONOTONIC) { struct timespec ts; clock_gettime(clock_type, &ts); return ts.tv_sec * 1000000000ULL + ts.tv_nsec; } inline UInt64 getCurrentTimeMicroseconds() { struct timeval tv; gettimeofday(&tv, nullptr); return (tv.tv_sec) * 1000000U + (tv.tv_usec); } struct RUsageCounters { /// In nanoseconds UInt64 real_time = 0; UInt64 user_time = 0; UInt64 sys_time = 0; UInt64 soft_page_faults = 0; UInt64 hard_page_faults = 0; RUsageCounters() = default; RUsageCounters(const ::rusage & rusage_, UInt64 real_time_) { set(rusage_, real_time_); } void set(const ::rusage & rusage, UInt64 real_time_) { real_time = real_time_; user_time = rusage.ru_utime.tv_sec * 1000000000UL + rusage.ru_utime.tv_usec * 1000UL; sys_time = rusage.ru_stime.tv_sec * 1000000000UL + rusage.ru_stime.tv_usec * 1000UL; soft_page_faults = static_cast(rusage.ru_minflt); hard_page_faults = static_cast(rusage.ru_majflt); } static RUsageCounters zeros(UInt64 real_time_ = getCurrentTimeNanoseconds()) { RUsageCounters res; res.real_time = real_time_; return res; } static RUsageCounters current(UInt64 real_time_ = getCurrentTimeNanoseconds()) { ::rusage rusage {}; #if !defined(__APPLE__) ::getrusage(RUSAGE_THREAD, &rusage); #endif return RUsageCounters(rusage, real_time_); } static void incrementProfileEvents(const RUsageCounters & prev, const RUsageCounters & curr, ProfileEvents::Counters & profile_events) { profile_events.increment(ProfileEvents::RealTimeMicroseconds, (curr.real_time - prev.real_time) / 1000U); profile_events.increment(ProfileEvents::UserTimeMicroseconds, (curr.user_time - prev.user_time) / 1000U); profile_events.increment(ProfileEvents::SystemTimeMicroseconds, (curr.sys_time - prev.sys_time) / 1000U); profile_events.increment(ProfileEvents::SoftPageFaults, curr.soft_page_faults - prev.soft_page_faults); profile_events.increment(ProfileEvents::HardPageFaults, curr.hard_page_faults - prev.hard_page_faults); } static void updateProfileEvents(RUsageCounters & last_counters, ProfileEvents::Counters & profile_events) { auto current_counters = current(); incrementProfileEvents(last_counters, current_counters, profile_events); last_counters = current_counters; } }; // thread_local is disabled in Arcadia, so we have to use a dummy implementation // there. #if defined(__linux__) && !defined(ARCADIA_BUILD) struct PerfEventInfo { // see perf_event.h/perf_type_id enum int event_type; // see configs in perf_event.h int event_config; ProfileEvents::Event profile_event; std::string settings_name; }; struct PerfEventValue { UInt64 value = 0; UInt64 time_enabled = 0; UInt64 time_running = 0; }; static constexpr size_t NUMBER_OF_RAW_EVENTS = 22; struct PerfDescriptorsHolder : boost::noncopyable { int descriptors[NUMBER_OF_RAW_EVENTS]{}; PerfDescriptorsHolder(); ~PerfDescriptorsHolder(); void releaseResources(); }; struct PerfEventsCounters { PerfDescriptorsHolder thread_events_descriptors_holder; // time_enabled and time_running can't be reset, so we have to store the // data from the previous profiling period and calculate deltas to them, // to be able to properly account for counter multiplexing. PerfEventValue previous_values[NUMBER_OF_RAW_EVENTS]{}; void initializeProfileEvents(const std::string & events_list); void finalizeProfileEvents(ProfileEvents::Counters & profile_events); void closeEventDescriptors(); bool processThreadLocalChanges(const std::string & needed_events_list); static std::vector eventIndicesFromString(const std::string & events_list); }; // Perf event creation is moderately heavy, so we create them once per thread and // then reuse. extern thread_local PerfEventsCounters current_thread_counters; #else // Not on Linux, or in Arcadia: the functionality is disabled. struct PerfEventsCounters { void initializeProfileEvents(const std::string & /* events_list */) {} void finalizeProfileEvents(ProfileEvents::Counters & /* profile_events */) {} void closeEventDescriptors() {} }; // thread_local is disabled in Arcadia, so we are going to use a static dummy. extern PerfEventsCounters current_thread_counters; #endif #if defined(__linux__) class TasksStatsCounters { public: static bool checkIfAvailable(); static std::unique_ptr create(const UInt64 tid); void reset(); void updateCounters(ProfileEvents::Counters & profile_events); private: ::taskstats stats; //-V730_NOINIT std::function<::taskstats()> stats_getter; enum class MetricsProvider { None, Procfs, Netlink }; private: explicit TasksStatsCounters(const UInt64 tid, const MetricsProvider provider); static MetricsProvider findBestAvailableProvider(); static void incrementProfileEvents(const ::taskstats & prev, const ::taskstats & curr, ProfileEvents::Counters & profile_events); }; #else class TasksStatsCounters { public: static bool checkIfAvailable() { return false; } static std::unique_ptr create(const UInt64 /*tid*/) { return {}; } void reset() {} void updateCounters(ProfileEvents::Counters &) {} private: TasksStatsCounters(const UInt64 /*tid*/) {} }; #endif }