ClickHouse/dbms/include/DB/Interpreters/ExternalDictionaries.h

128 lines
3.6 KiB
C++
Raw Normal View History

#pragma once
#include <DB/Dictionaries/IDictionary.h>
2015-10-05 01:35:28 +00:00
#include <DB/Common/Exception.h>
#include <DB/Common/setThreadName.h>
2016-07-31 03:53:16 +00:00
#include <DB/Common/randomSeed.h>
2015-09-29 19:19:54 +00:00
#include <common/MultiVersion.h>
#include <common/logger_useful.h>
#include <Poco/Event.h>
#include <unistd.h>
#include <time.h>
#include <mutex>
#include <thread>
#include <unordered_map>
#include <chrono>
#include <random>
namespace DB
{
class Context;
/** Manages user-defined dictionaries.
* Monitors configuration file and automatically reloads dictionaries in a separate thread.
* The monitoring thread wakes up every @check_period_sec seconds and checks
* modification time of dictionaries' configuration file. If said time is greater than
* @config_last_modified, the dictionaries are created from scratch using configuration file,
* possibly overriding currently existing dictionaries with the same name (previous versions of
* overridden dictionaries will live as long as there are any users retaining them).
*
* Apart from checking configuration file for modifications, each non-cached dictionary
* has a lifetime of its own and may be updated if it's source reports that it has been
* modified. The time of next update is calculated by choosing uniformly a random number
* distributed between lifetime.min_sec and lifetime.max_sec.
* If either of lifetime.min_sec and lifetime.max_sec is zero, such dictionary is never updated.
*/
class ExternalDictionaries
{
private:
static const auto check_period_sec = 5;
friend class StorageSystemDictionaries;
mutable std::mutex dictionaries_mutex;
2016-08-07 09:09:18 +00:00
using DictionaryPtr = std::shared_ptr<MultiVersion<IDictionaryBase>>;
struct DictionaryInfo final
{
2016-08-07 09:09:18 +00:00
DictionaryPtr dict;
std::string origin;
std::exception_ptr exception;
};
2016-08-07 09:09:18 +00:00
struct FailedDictionaryInfo final
{
std::unique_ptr<IDictionaryBase> dict;
std::chrono::system_clock::time_point next_attempt_time;
UInt64 error_count;
};
2016-10-18 19:32:32 +00:00
/** name -> dictionary.
*/
2016-08-07 09:09:18 +00:00
std::unordered_map<std::string, DictionaryInfo> dictionaries;
2016-10-18 19:32:32 +00:00
/** Here are dictionaries, that has been never loaded sussessfully.
* They are also in 'dictionaries', but with nullptr as 'dict'.
*/
2016-08-07 09:09:18 +00:00
std::unordered_map<std::string, FailedDictionaryInfo> failed_dictionaries;
2016-10-18 19:32:32 +00:00
/** Both for dictionaries and failed_dictionaries.
*/
std::unordered_map<std::string, std::chrono::system_clock::time_point> update_times;
2016-07-31 03:53:16 +00:00
std::mt19937_64 rnd_engine{randomSeed()};
Context & context;
std::thread reloading_thread;
Poco::Event destroy;
Logger * log;
std::unordered_map<std::string, Poco::Timestamp> last_modification_times;
void reloadImpl(bool throw_on_error = false);
void reloadFromFile(const std::string & config_path, bool throw_on_error);
void reloadPeriodically()
{
setThreadName("ExterDictReload");
while (true)
{
if (destroy.tryWait(check_period_sec * 1000))
return;
reloadImpl();
}
}
public:
2016-10-18 19:32:32 +00:00
/// Dictionaries will be loaded immediately and then will be updated in separate thread, each 'reload_period' seconds.
ExternalDictionaries(Context & context, const bool throw_on_error)
: context(context), log(&Logger::get("ExternalDictionaries"))
{
{
2016-10-18 19:32:32 +00:00
/** During synchronous loading of external dictionaries at moment of query execution,
* we should not use per query memory limit.
*/
TemporarilyDisableMemoryTracker temporarily_disable_memory_tracker;
reloadImpl(throw_on_error);
}
reloading_thread = std::thread{&ExternalDictionaries::reloadPeriodically, this};
}
~ExternalDictionaries()
{
destroy.set();
reloading_thread.join();
}
MultiVersion<IDictionaryBase>::Version getDictionary(const std::string & name) const;
};
}