ClickHouse/libs/libcommon/src/DateLUT.cpp

125 lines
4.2 KiB
C++
Raw Normal View History

2015-09-29 19:19:54 +00:00
#include <common/DateLUT.h>
#include <boost/filesystem.hpp>
#include <Poco/Exception.h>
#include <Poco/SHA1Engine.h>
#include <Poco/DigestStream.h>
#include <fstream>
namespace
{
2009-05-28 18:19:51 +00:00
Poco::DigestEngine::Digest calcSHA1(const std::string & path)
{
std::ifstream stream(path);
if (!stream)
2019-07-01 19:55:35 +00:00
throw Poco::Exception("Error while opening file: '" + path + "'.");
Poco::SHA1Engine digest_engine;
Poco::DigestInputStream digest_stream(digest_engine, stream);
digest_stream.ignore(std::numeric_limits<std::streamsize>::max());
if (!stream.eof())
2019-07-01 19:55:35 +00:00
throw Poco::Exception("Error while reading file: '" + path + "'.");
return digest_engine.digest();
}
std::string determineDefaultTimeZone()
2009-05-28 18:19:51 +00:00
{
namespace fs = boost::filesystem;
const char * tzdir_env_var = std::getenv("TZDIR");
fs::path tz_database_path = tzdir_env_var ? tzdir_env_var : "/usr/share/zoneinfo/";
fs::path tz_file_path;
std::string error_prefix;
const char * tz_env_var = std::getenv("TZ");
/// In recent tzdata packages some files now are symlinks and canonical path resolution
/// may give wrong timezone names - store the name as it is, if possible.
std::string tz_name;
if (tz_env_var)
{
2019-07-01 19:55:35 +00:00
error_prefix = std::string("Could not determine time zone from TZ variable value: '") + tz_env_var + "': ";
if (*tz_env_var == ':')
++tz_env_var;
tz_file_path = tz_env_var;
tz_name = tz_env_var;
}
else
{
error_prefix = "Could not determine local time zone: ";
tz_file_path = "/etc/localtime"; /// FIXME: in case of no TZ use the immediate linked file as tz name.
}
try
{
tz_database_path = fs::canonical(tz_database_path);
tz_file_path = fs::canonical(tz_file_path, tz_database_path);
/// The tzdata file exists. If it is inside the tz_database_dir,
/// then the relative path is the time zone id.
fs::path relative_path = tz_file_path.lexically_relative(tz_database_path);
if (!relative_path.empty() && *relative_path.begin() != ".." && *relative_path.begin() != ".")
return tz_name.empty() ? relative_path.string() : tz_name;
/// The file is not inside the tz_database_dir, so we hope that it was copied and
/// try to find the file with exact same contents in the database.
size_t tzfile_size = fs::file_size(tz_file_path);
Poco::SHA1Engine::Digest tzfile_sha1 = calcSHA1(tz_file_path.string());
fs::recursive_directory_iterator begin(tz_database_path);
fs::recursive_directory_iterator end;
for (auto candidate_it = begin; candidate_it != end; ++candidate_it)
{
const auto & path = candidate_it->path();
if (path.filename() == "posix" || path.filename() == "right")
{
/// Some timezone databases contain copies of toplevel tzdata files in the posix/ directory
/// and tzdata files with leap seconds in the right/ directory. Skip them.
candidate_it.no_push();
continue;
}
if (candidate_it->status().type() != fs::regular_file || path.filename() == "localtime")
continue;
if (fs::file_size(path) == tzfile_size && calcSHA1(path.string()) == tzfile_sha1)
return path.lexically_relative(tz_database_path).string();
}
}
catch (const Poco::Exception & ex)
{
throw Poco::Exception(error_prefix + ex.message(), ex);
}
catch (const std::exception & ex)
{
throw Poco::Exception(error_prefix + ex.what());
}
throw Poco::Exception(error_prefix + "custom time zone file used.");
}
}
DateLUT::DateLUT()
{
/// Initialize the pointer to the default DateLUTImpl.
std::string default_time_zone = determineDefaultTimeZone();
default_impl.store(&getImplementation(default_time_zone), std::memory_order_release);
2009-05-28 18:19:51 +00:00
}
const DateLUTImpl & DateLUT::getImplementation(const std::string & time_zone) const
{
std::lock_guard<std::mutex> lock(mutex);
auto it = impls.emplace(time_zone, nullptr).first;
if (!it->second)
it->second = std::make_unique<DateLUTImpl>(time_zone);
return *it->second;
}