mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-11-19 22:22:00 +00:00
143 lines
4.4 KiB
C++
143 lines
4.4 KiB
C++
#include <DB/Storages/StorageSet.h>
|
||
#include <DB/IO/ReadBufferFromFile.h>
|
||
#include <DB/IO/CompressedReadBuffer.h>
|
||
#include <DB/DataStreams/NativeBlockInputStream.h>
|
||
#include <DB/Common/escapeForFileName.h>
|
||
#include <Poco/DirectoryIterator.h>
|
||
|
||
|
||
namespace DB
|
||
{
|
||
|
||
|
||
/** Creates an output stream that passes blocks to `table_` and also writes them to a backup file.
  *
  * The backup file is opened at backup_tmp_path_ + backup_file_name_ and is written through a chain
  * of three layers: block stream -> compressed buffer -> file buffer.
  * backup_path_ is only remembered here; it is used by writeSuffix() as the final location of the file.
  *
  * NOTE(review): compressed_backup_buf and backup_stream are initialised from other members, so this
  * relies on the members being declared in the class in the same order as they are listed below
  * (the class declaration is not visible in this file - confirm in the header).
  */
SetOrJoinBlockOutputStream::SetOrJoinBlockOutputStream(
    StorageSetOrJoinBase & table_,
    const String & backup_path_,
    const String & backup_tmp_path_,
    const String & backup_file_name_)
    : table(table_)
    , backup_path(backup_path_)
    , backup_tmp_path(backup_tmp_path_)
    , backup_file_name(backup_file_name_)
    /// The file is opened in the temporary directory; the path is built from the constructor arguments.
    , backup_buf(backup_tmp_path_ + backup_file_name_)
    , compressed_backup_buf(backup_buf)
    , backup_stream(compressed_backup_buf)
{
}
|
||
|
||
void SetOrJoinBlockOutputStream::write(const Block & block)
|
||
{
|
||
/// Сортируем столбцы в блоке. Это нужно, так как Set и Join рассчитывают на одинаковый порядок столбцов в разных блоках.
|
||
Block sorted_block = block.sortColumns();
|
||
|
||
table.insertBlock(sorted_block);
|
||
backup_stream.write(sorted_block);
|
||
}
|
||
|
||
void SetOrJoinBlockOutputStream::writeSuffix()
|
||
{
|
||
backup_stream.flush();
|
||
compressed_backup_buf.next();
|
||
backup_buf.next();
|
||
|
||
Poco::File(backup_tmp_path + backup_file_name).renameTo(backup_path + backup_file_name);
|
||
}
|
||
|
||
|
||
|
||
/** Starts an insertion into the table and returns the stream to write blocks to.
  *
  * Every call advances `increment` and uses the new value as the name of the backup file: "<increment>.bin".
  * The stream writes that file under path + "tmp/" and, on writeSuffix(), moves it into `path`.
  * The `query` and `settings` arguments are not used by this implementation.
  */
BlockOutputStreamPtr StorageSetOrJoinBase::write(ASTPtr query, const Settings & settings)
{
    ++increment;

    const String backup_file_name = toString(increment) + ".bin";
    const String backup_tmp_path = path + "tmp/";

    return new SetOrJoinBlockOutputStream(*this, path, backup_tmp_path, backup_file_name);
}
|
||
|
||
|
||
StorageSetOrJoinBase::StorageSetOrJoinBase(
|
||
const String & path_,
|
||
const String & name_,
|
||
NamesAndTypesListPtr columns_,
|
||
const NamesAndTypesList & materialized_columns_,
|
||
const NamesAndTypesList & alias_columns_,
|
||
const ColumnDefaults & column_defaults_)
|
||
: IStorage{materialized_columns_, alias_columns_, column_defaults_},
|
||
path(path_ + escapeForFileName(name_) + '/'), name(name_), columns(columns_)
|
||
{
|
||
}
|
||
|
||
|
||
|
||
StorageSet::StorageSet(
|
||
const String & path_,
|
||
const String & name_,
|
||
NamesAndTypesListPtr columns_,
|
||
const NamesAndTypesList & materialized_columns_,
|
||
const NamesAndTypesList & alias_columns_,
|
||
const ColumnDefaults & column_defaults_)
|
||
: StorageSetOrJoinBase{path_, name_, columns_, materialized_columns_, alias_columns_, column_defaults_}
|
||
{
|
||
restore();
|
||
}
|
||
|
||
|
||
void StorageSetOrJoinBase::restore()
|
||
{
|
||
Poco::File tmp_dir(path + "tmp/");
|
||
if (!tmp_dir.exists())
|
||
{
|
||
tmp_dir.createDirectories();
|
||
return;
|
||
}
|
||
|
||
constexpr auto file_suffix = ".bin";
|
||
constexpr auto file_suffix_size = strlen(file_suffix);
|
||
|
||
Poco::DirectoryIterator dir_end;
|
||
for (Poco::DirectoryIterator dir_it(path); dir_end != dir_it; ++dir_it)
|
||
{
|
||
const auto & name = dir_it.name();
|
||
|
||
if (dir_it->isFile()
|
||
&& name.size() > file_suffix_size
|
||
&& 0 == name.compare(name.size() - file_suffix_size, file_suffix_size, file_suffix)
|
||
&& dir_it->getSize() > 0)
|
||
{
|
||
/// Вычисляем максимальный номер имеющихся файлов с бэкапом, чтобы добавлять следующие файлы с большими номерами.
|
||
UInt64 file_num = parse<UInt64>(name.substr(0, name.size() - file_suffix_size));
|
||
if (file_num > increment)
|
||
increment = file_num;
|
||
|
||
restoreFromFile(dir_it->path());
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
void StorageSetOrJoinBase::restoreFromFile(const String & file_path)
|
||
{
|
||
ReadBufferFromFile backup_buf(file_path);
|
||
CompressedReadBuffer compressed_backup_buf(backup_buf);
|
||
NativeBlockInputStream backup_stream(compressed_backup_buf);
|
||
|
||
backup_stream.readPrefix();
|
||
while (Block block = backup_stream.read())
|
||
insertBlock(block);
|
||
backup_stream.readSuffix();
|
||
|
||
/// TODO Добавить скорость, сжатые байты, объём данных в памяти, коэффициент сжатия... Обобщить всё логгирование статистики в проекте.
|
||
LOG_INFO(&Logger::get("StorageSetOrJoinBase"), std::fixed << std::setprecision(2)
|
||
<< "Loaded from backup file " << file_path << ". "
|
||
<< backup_stream.getInfo().rows << " rows, "
|
||
<< backup_stream.getInfo().bytes / 1048576.0 << " MiB. "
|
||
<< "State has " << getSize() << " unique rows.");
|
||
}
|
||
|
||
|
||
void StorageSetOrJoinBase::rename(const String & new_path_to_db, const String & new_database_name, const String & new_table_name)
|
||
{
|
||
/// Переименовываем директорию с данными.
|
||
String new_path = new_path_to_db + escapeForFileName(new_table_name);
|
||
Poco::File(path).renameTo(new_path);
|
||
|
||
path = new_path + "/";
|
||
name = new_table_name;
|
||
}
|
||
|
||
|
||
}
|