ClickHouse/src/Storages/MergeTree/BackgroundProcessingPool.h

166 lines
4.8 KiB
C++
Raw Normal View History

2014-04-11 13:05:17 +00:00
#pragma once
#include <thread>
#include <set>
#include <map>
2014-07-03 08:51:11 +00:00
#include <list>
#include <condition_variable>
#include <mutex>
#include <shared_mutex>
#include <atomic>
2017-09-18 18:52:12 +00:00
#include <functional>
2014-07-03 08:51:11 +00:00
#include <Poco/Event.h>
2016-10-14 02:51:03 +00:00
#include <Poco/Timestamp.h>
2020-09-15 09:55:57 +00:00
#include <common/types.h>
#include <Common/CurrentMetrics.h>
#include <Common/CurrentThread.h>
#include <Common/ThreadPool.h>
#include <Poco/Util/AbstractConfiguration.h>
namespace CurrentMetrics
{
extern const Metric BackgroundPoolTask;
extern const Metric MemoryTrackingInBackgroundProcessingPool;
}
2014-04-11 13:05:17 +00:00
namespace DB
{
class BackgroundProcessingPool;
class BackgroundProcessingPoolTaskInfo;
2018-12-26 17:03:29 +00:00
enum class BackgroundProcessingPoolTaskResult
{
SUCCESS,
ERROR,
NOTHING_TO_DO,
};
2019-04-06 00:36:04 +00:00
2017-04-16 15:00:33 +00:00
/** Using a fixed number of threads, perform an arbitrary number of tasks in an infinite loop.
* In this case, one task can run simultaneously from different threads.
* Designed for tasks that perform continuous background work (for example, merge).
* `Task` is a function that returns a bool - did it do any work.
* If not, then the next time will be done later.
2014-04-11 13:05:17 +00:00
*/
class BackgroundProcessingPool
{
public:
/// Returns true, if some useful work was done. In that case, thread will not sleep before next run of this task.
2018-12-26 17:03:29 +00:00
using TaskResult = BackgroundProcessingPoolTaskResult;
using Task = std::function<TaskResult()>;
using TaskInfo = BackgroundProcessingPoolTaskInfo;
using TaskHandle = std::shared_ptr<TaskInfo>;
2014-07-03 08:51:11 +00:00
2014-04-11 13:05:17 +00:00
2019-12-05 08:05:07 +00:00
struct PoolSettings
{
double thread_sleep_seconds = 10;
double thread_sleep_seconds_random_part = 1.0;
double thread_sleep_seconds_if_nothing_to_do = 0.1;
/// For exponential backoff.
double task_sleep_seconds_when_no_work_min = 10;
double task_sleep_seconds_when_no_work_max = 600;
double task_sleep_seconds_when_no_work_multiplier = 1.1;
double task_sleep_seconds_when_no_work_random_part = 1.0;
CurrentMetrics::Metric tasks_metric = CurrentMetrics::BackgroundPoolTask;
CurrentMetrics::Metric memory_metric = CurrentMetrics::MemoryTrackingInBackgroundProcessingPool;
2019-12-05 08:05:07 +00:00
PoolSettings() noexcept {}
};
2019-11-17 21:00:10 +00:00
BackgroundProcessingPool(int size_,
2019-12-05 08:05:07 +00:00
const PoolSettings & pool_settings = {},
2019-11-17 21:00:10 +00:00
const char * log_name = "BackgroundProcessingPool",
const char * thread_name_ = "BackgrProcPool");
2014-04-11 13:05:17 +00:00
size_t getNumberOfThreads() const
{
return size;
}
2014-04-11 13:05:17 +00:00
2020-06-02 15:22:05 +00:00
/// Create task and start it.
TaskHandle addTask(const Task & task);
/// The following two methods are invoked by Storage*MergeTree at startup
/// Create task but not start it.
TaskHandle createTask(const Task & task);
/// Start the task that was created but not started. Precondition: task was not started.
void startTask(const TaskHandle & task, bool allow_execute_in_parallel = true);
/// Invoked by Storage*MergeTree at shutdown
void removeTask(const TaskHandle & task);
2014-04-11 13:05:17 +00:00
~BackgroundProcessingPool();
2014-04-11 13:05:17 +00:00
protected:
friend class BackgroundProcessingPoolTaskInfo;
using Tasks = std::multimap<Poco::Timestamp, TaskHandle>; /// key is desired next time to execute (priority).
using Threads = std::vector<ThreadFromGlobalPool>;
2014-04-11 13:05:17 +00:00
const size_t size;
const char * thread_name;
Poco::Logger * logger;
Tasks tasks; /// Ordered in priority.
std::mutex tasks_mutex;
2016-09-01 02:26:45 +00:00
Threads threads;
bool shutdown{false};
std::condition_variable wake_event;
2014-04-11 13:05:17 +00:00
/// Thread group used for profiling purposes
ThreadGroupStatusPtr thread_group;
void workLoopFunc();
void rescheduleTask(Tasks::iterator & task_it, const Poco::Timestamp & new_scheduled_ts)
{
auto node_handle = tasks.extract(task_it);
node_handle.key() = new_scheduled_ts;
task_it = tasks.insert(std::move(node_handle));
}
private:
2019-12-05 08:05:07 +00:00
PoolSettings settings;
2014-04-11 13:05:17 +00:00
};
class BackgroundProcessingPoolTaskInfo
{
public:
/// Signals random idle thread from the pool that this task is ready to be executed.
2020-06-02 15:18:36 +00:00
void signalReadyToRun();
BackgroundProcessingPoolTaskInfo(BackgroundProcessingPool & pool_, const BackgroundProcessingPool::Task & function_)
: pool(pool_), task_function(function_) {}
protected:
friend class BackgroundProcessingPool;
BackgroundProcessingPool & pool;
BackgroundProcessingPool::Task task_function;
/// Read lock is held while task is being executed.
/// Write lock is used for stopping BGProcPool
std::shared_mutex rwlock;
bool allow_execute_in_parallel = false;
size_t concurrent_executors = 0;
/// Signals that this task must no longer be planned for execution and is about to be removed
std::atomic<bool> removed {false};
BackgroundProcessingPool::Tasks::iterator iterator;
/// For exponential backoff.
size_t count_no_work_done = 0;
};
2014-04-11 13:05:17 +00:00
}