mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-11-16 12:44:42 +00:00
e623ad041f
C-z is extremely useful for some users (like myself), so provide a way to configure it in the client and avoid ignoring it in clickhouse-disks (I hope it is OK, since it is not that well-known a utility and it does not have its own configuration, while a CLI option is useless because one has to remember about it). Honestly, I've never seen any interactive client that forbids C-z, so ignoring it by default looks strange to me. Signed-off-by: Azat Khuzhin <a.khuzhin@semrush.com>
263 lines
6.8 KiB
C++
263 lines
6.8 KiB
C++
#include "DisksClient.h"
|
|
#include <Client/ClientBase.h>
|
|
#include <Disks/registerDisks.h>
|
|
#include <Common/Config/ConfigProcessor.h>
|
|
|
|
#include <Formats/registerFormats.h>
|
|
|
|
/// Error codes used by this translation unit.
/// They are declared inside DB::ErrorCodes because every use below lives in namespace DB
/// (one of them is spelled explicitly as DB::ErrorCodes::BAD_ARGUMENTS); declaring them in a
/// global ::ErrorCodes namespace would introduce unrelated symbols that nothing refers to.
namespace DB::ErrorCodes
{
    extern const int BAD_ARGUMENTS;
    extern const int LOGICAL_ERROR;
}
|
|
|
|
namespace DB
|
|
{
|
|
/// Binds a disk to a current directory on it.
/// If `path_` is given it must be absolute; otherwise the current directory is "/".
/// Throws BAD_ARGUMENTS when `path_` is not absolute or when the resulting path
/// is not reported as a directory by the disk.
DiskWithPath::DiskWithPath(DiskPtr disk_, std::optional<String> path_) : disk(disk_)
{
    if (!path_.has_value())
    {
        path = String{"/"};
    }
    else
    {
        if (!fs::path{path_.value()}.is_absolute())
            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Initializing path {} is not absolute", path_.value());

        path = path_.value();
    }

    String relative_path = normalizePathAndGetAsRelative(path);

    /// The relative form of the root is an empty string, so the root itself is probed as "/".
    const bool points_to_directory
        = disk->isDirectory(relative_path) || (relative_path.empty() && (disk->isDirectory("/")));

    if (!points_to_directory)
        throw Exception(
            ErrorCodes::BAD_ARGUMENTS,
            "Initializing path {} (normalized path: {}) at disk {} is not a directory",
            path,
            relative_path,
            disk->getName());
}
|
|
|
|
std::vector<String> DiskWithPath::listAllFilesByPath(const String & any_path) const
|
|
{
|
|
if (isDirectory(any_path))
|
|
{
|
|
std::vector<String> file_names;
|
|
disk->listFiles(getRelativeFromRoot(any_path), file_names);
|
|
return file_names;
|
|
}
|
|
else
|
|
{
|
|
return {};
|
|
}
|
|
}
|
|
|
|
std::vector<String> DiskWithPath::getAllFilesByPattern(const String & pattern) const
|
|
{
|
|
auto [path_before, path_after] = [&]() -> std::pair<String, String>
|
|
{
|
|
auto slash_pos = pattern.find_last_of('/');
|
|
if (slash_pos >= pattern.size())
|
|
{
|
|
return {"", pattern};
|
|
}
|
|
else
|
|
{
|
|
return {pattern.substr(0, slash_pos + 1), pattern.substr(slash_pos + 1, pattern.size() - slash_pos - 1)};
|
|
}
|
|
}();
|
|
|
|
if (!isDirectory(path_before))
|
|
{
|
|
return {};
|
|
}
|
|
else
|
|
{
|
|
std::vector<String> file_names = listAllFilesByPath(path_before);
|
|
|
|
std::vector<String> answer;
|
|
|
|
for (const auto & file_name : file_names)
|
|
{
|
|
if (file_name.starts_with(path_after))
|
|
{
|
|
String file_pattern = path_before + file_name;
|
|
if (isDirectory(file_pattern))
|
|
{
|
|
file_pattern = file_pattern + "/";
|
|
}
|
|
answer.push_back(file_pattern);
|
|
}
|
|
}
|
|
return answer;
|
|
}
|
|
};
|
|
|
|
void DiskWithPath::setPath(const String & any_path)
|
|
{
|
|
if (isDirectory(any_path))
|
|
{
|
|
path = getAbsolutePath(any_path);
|
|
}
|
|
else
|
|
{
|
|
throw Exception(ErrorCodes::BAD_ARGUMENTS, "Path {} at disk {} is not a directory", any_path, disk->getName());
|
|
}
|
|
}
|
|
|
|
/// Lexically normalizes `path` and returns it in the form used inside a disk,
/// i.e. with the leading '/' of an absolute path removed.
/// Throws BAD_ARGUMENTS if a ".." component survives normalization.
String DiskWithPath::validatePathAndGetAsRelative(const String & path)
{
    const fs::path normalized = fs::path(path).lexically_normal();

    /// Inspect whole components rather than searching for the substring "..":
    /// names such as "a..b" or "..." are ordinary file names and must not be rejected.
    for (const auto & component : normalized)
    {
        if (component == fs::path(".."))
            throw DB::Exception(DB::ErrorCodes::BAD_ARGUMENTS, "Path {} is not normalized", path);
    }

    String lexically_normal_path = normalized.string();

    /// If path is absolute we should keep it as relative inside disk, so disk will look like
    /// an ordinary filesystem with root.
    if (normalized.is_absolute())
        return lexically_normal_path.substr(1);

    return lexically_normal_path;
}
|
|
|
|
/// Canonicalizes `messyPath` with std::filesystem::weakly_canonical, converts separators to the
/// preferred form, then validates the result and returns it as a path relative to the disk root.
String DiskWithPath::normalizePathAndGetAsRelative(const String & messyPath)
{
    std::filesystem::path canonical = std::filesystem::weakly_canonical(std::filesystem::path(messyPath));
    canonical.make_preferred();
    return validatePathAndGetAsRelative(canonical.string());
}
|
|
|
|
/// Returns `path` canonicalized with std::filesystem::weakly_canonical,
/// with separators converted to the preferred form.
String DiskWithPath::normalizePath(const String & path)
{
    /// make_preferred() modifies the temporary in place; string() copies it out before it dies.
    return std::filesystem::weakly_canonical(path).make_preferred().string();
}
|
|
|
|
/// Registers every (disk, optional initial path) pair and selects the starting disk.
/// When `begin_disk` is not given, the name of the first disk in the array is used.
/// Throws BAD_ARGUMENTS if the array is empty or contains no disk named `begin_disk`;
/// exceptions from addDisk() propagate unchanged.
DisksClient::DisksClient(std::vector<std::pair<DiskPtr, std::optional<String>>> && disks_with_paths, std::optional<String> begin_disk)
{
    if (disks_with_paths.empty())
        throw Exception(ErrorCodes::BAD_ARGUMENTS, "Initializing array of disks is empty");

    if (!begin_disk)
        begin_disk = disks_with_paths[0].first->getName();

    bool begin_disk_registered = false;
    for (auto & [disk, path] : disks_with_paths)
    {
        addDisk(disk, path);
        begin_disk_registered |= (disk->getName() == *begin_disk);
    }

    if (!begin_disk_registered)
        throw Exception(ErrorCodes::BAD_ARGUMENTS, "There is no begin_disk '{}' in initializing array", *begin_disk);

    current_disk = std::move(*begin_disk);
}
|
|
|
|
/// Returns the registered entry for the disk named `disk`.
/// Throws BAD_ARGUMENTS if no such disk is registered.
const DiskWithPath & DisksClient::getDiskWithPath(const String & disk) const
{
    /// Explicit lookup instead of at() + catch (...): a missing key is an expected outcome here,
    /// and a catch-all would also convert any unrelated exception into "unknown disk".
    const auto it = disks.find(disk);
    if (it == disks.end())
        throw Exception(ErrorCodes::BAD_ARGUMENTS, "The disk '{}' is unknown", disk);

    return it->second;
}
|
|
|
|
/// Returns the registered, mutable entry for the disk named `disk`.
/// Throws BAD_ARGUMENTS if no such disk is registered.
DiskWithPath & DisksClient::getDiskWithPath(const String & disk)
{
    /// Explicit lookup instead of at() + catch (...): a missing key is an expected outcome here,
    /// and a catch-all would also convert any unrelated exception into "unknown disk".
    const auto it = disks.find(disk);
    if (it == disks.end())
        throw Exception(ErrorCodes::BAD_ARGUMENTS, "The disk '{}' is unknown", disk);

    return it->second;
}
|
|
|
|
/// Returns the entry of the currently selected disk.
/// Throws LOGICAL_ERROR if `current_disk` does not name a registered disk.
const DiskWithPath & DisksClient::getCurrentDiskWithPath() const
{
    /// Explicit lookup instead of at() + catch (...), so that only the "not registered"
    /// case is reported as a logical error.
    const auto it = disks.find(current_disk);
    if (it == disks.end())
        throw Exception(ErrorCodes::LOGICAL_ERROR, "There is no current disk in client");

    return it->second;
}
|
|
|
|
/// Returns the mutable entry of the currently selected disk.
/// Throws LOGICAL_ERROR if `current_disk` does not name a registered disk.
DiskWithPath & DisksClient::getCurrentDiskWithPath()
{
    /// Explicit lookup instead of at() + catch (...), so that only the "not registered"
    /// case is reported as a logical error.
    const auto it = disks.find(current_disk);
    if (it == disks.end())
        throw Exception(ErrorCodes::LOGICAL_ERROR, "There is no current disk in client");

    return it->second;
}
|
|
|
|
void DisksClient::switchToDisk(const String & disk_, const std::optional<String> & path_)
|
|
{
|
|
if (disks.contains(disk_))
|
|
{
|
|
if (path_.has_value())
|
|
{
|
|
disks.at(disk_).setPath(path_.value());
|
|
}
|
|
current_disk = disk_;
|
|
}
|
|
else
|
|
{
|
|
throw Exception(ErrorCodes::BAD_ARGUMENTS, "The disk '{}' is unknown", disk_);
|
|
}
|
|
}
|
|
|
|
std::vector<String> DisksClient::getAllDiskNames() const
|
|
{
|
|
std::vector<String> answer{};
|
|
answer.reserve(disks.size());
|
|
for (const auto & [disk_name, _] : disks)
|
|
{
|
|
answer.push_back(disk_name);
|
|
}
|
|
return answer;
|
|
}
|
|
|
|
std::vector<String> DisksClient::getAllFilesByPatternFromAllDisks(const String & pattern) const
|
|
{
|
|
std::vector<String> answer{};
|
|
for (const auto & [_, disk] : disks)
|
|
{
|
|
for (auto & word : disk.getAllFilesByPattern(pattern))
|
|
{
|
|
answer.push_back(word);
|
|
}
|
|
}
|
|
return answer;
|
|
}
|
|
|
|
/// Registers `disk_` under its own name, with `path_` as its initial directory.
/// Throws BAD_ARGUMENTS if a disk with the same name is already registered;
/// exceptions from the DiskWithPath constructor propagate and leave `disks` unchanged.
void DisksClient::addDisk(DiskPtr disk_, const std::optional<String> & path_)
{
    /// Query the name once and reuse it for the lookup, the error message and the key.
    const String disk_name = disk_->getName();

    if (disks.contains(disk_name))
        throw Exception(ErrorCodes::BAD_ARGUMENTS, "The disk '{}' already exists", disk_name);

    disks.emplace(disk_name, DiskWithPath{disk_, path_});
}
|
|
}
|