#pragma once #include #include #include #include #include #include #include #include #include #include #include #include namespace Poco { class Logger; } namespace DB { class ReadBuffer; struct AsynchronousMetricValue { double value; const char * documentation; template AsynchronousMetricValue(T value_, const char * documentation_) : value(static_cast(value_)), documentation(documentation_) {} AsynchronousMetricValue() = default; /// For std::unordered_map::operator[]. }; using AsynchronousMetricValues = std::unordered_map; struct ProtocolServerMetrics { String port_name; size_t current_threads; }; /** Periodically (by default, each minute, starting at 30 seconds offset) * calculates and updates some metrics, * that are not updated automatically (so, need to be asynchronously calculated). * * This includes both ClickHouse-related metrics (like memory usage of ClickHouse process) * and common OS-related metrics (like total memory usage on the server). * * All the values are either gauge type (like the total number of tables, the current memory usage). * Or delta-counters representing some accumulation during the interval of time. */ class AsynchronousMetrics { public: using ProtocolServerMetricsFunc = std::function()>; AsynchronousMetrics( int update_period_seconds, const ProtocolServerMetricsFunc & protocol_server_metrics_func_); virtual ~AsynchronousMetrics(); /// Separate method allows to initialize the `servers` variable beforehand. void start(); void stop(); /// Returns copy of all values. AsynchronousMetricValues getValues() const; protected: using Duration = std::chrono::seconds; using TimePoint = std::chrono::system_clock::time_point; const Duration update_period; /// Some values are incremental and we have to calculate the difference. /// On first run we will only collect the values to subtract later. bool first_run = true; TimePoint previous_update_time; Poco::Logger * log; private: virtual void updateImpl(AsynchronousMetricValues & new_values, TimePoint update_time, TimePoint current_time) = 0; virtual void logImpl(AsynchronousMetricValues &) {} ProtocolServerMetricsFunc protocol_server_metrics_func; mutable std::mutex mutex; std::condition_variable wait_cond; bool quit {false}; AsynchronousMetricValues values; #if defined(OS_LINUX) || defined(OS_FREEBSD) MemoryStatisticsOS memory_stat; #endif #if defined(OS_LINUX) std::optional meminfo; std::optional loadavg; std::optional proc_stat; std::optional cpuinfo; std::optional file_nr; std::optional uptime; std::optional net_dev; std::optional cgroupmem_limit_in_bytes; std::optional cgroupmem_usage_in_bytes; std::vector> thermal; std::unordered_map>> hwmon_devices; std::vector /* correctable errors */, std::unique_ptr /* uncorrectable errors */>> edac; std::unordered_map> block_devs; /// TODO: socket statistics. struct ProcStatValuesCPU { uint64_t user; uint64_t nice; uint64_t system; uint64_t idle; uint64_t iowait; uint64_t irq; uint64_t softirq; uint64_t steal; uint64_t guest; uint64_t guest_nice; void read(ReadBuffer & in); ProcStatValuesCPU operator-(const ProcStatValuesCPU & other) const; }; struct ProcStatValuesOther { uint64_t interrupts; uint64_t context_switches; uint64_t processes_created; ProcStatValuesOther operator-(const ProcStatValuesOther & other) const; }; ProcStatValuesCPU proc_stat_values_all_cpus{}; ProcStatValuesOther proc_stat_values_other{}; std::vector proc_stat_values_per_cpu; /// https://www.kernel.org/doc/Documentation/block/stat.txt struct BlockDeviceStatValues { uint64_t read_ios; uint64_t read_merges; uint64_t read_sectors; uint64_t read_ticks; uint64_t write_ios; uint64_t write_merges; uint64_t write_sectors; uint64_t write_ticks; uint64_t in_flight_ios; uint64_t io_ticks; uint64_t time_in_queue; uint64_t discard_ops; uint64_t discard_merges; uint64_t discard_sectors; uint64_t discard_ticks; void read(ReadBuffer & in); BlockDeviceStatValues operator-(const BlockDeviceStatValues & other) const; }; std::unordered_map block_device_stats; struct NetworkInterfaceStatValues { uint64_t recv_bytes; uint64_t recv_packets; uint64_t recv_errors; uint64_t recv_drop; uint64_t send_bytes; uint64_t send_packets; uint64_t send_errors; uint64_t send_drop; NetworkInterfaceStatValues operator-(const NetworkInterfaceStatValues & other) const; }; std::unordered_map network_interface_stats; Stopwatch block_devices_rescan_delay; void openSensors(); void openBlockDevices(); void openSensorsChips(); void openEDAC(); #endif std::unique_ptr thread; void run(); void update(TimePoint update_time); }; }