2023-01-25 17:34:09 +00:00
# include <Storages/MergeTree/DataPartStorageOnDiskBase.h>
2022-04-05 19:12:48 +00:00
# include <Storages/MergeTree/MergeTreeDataPartChecksum.h>
2022-04-19 19:34:41 +00:00
# include <Disks/TemporaryFileOnDisk.h>
2022-04-05 19:12:48 +00:00
# include <IO/WriteBufferFromFileBase.h>
2023-01-25 17:34:09 +00:00
# include <IO/ReadBufferFromString.h>
2022-05-03 15:48:05 +00:00
# include <IO/ReadHelpers.h>
2022-05-03 17:58:47 +00:00
# include <Common/logger_useful.h>
2023-01-25 17:34:09 +00:00
# include <Storages/MergeTree/localBackup.h>
2022-04-19 19:34:41 +00:00
# include <Backups/BackupEntryFromSmallFile.h>
# include <Backups/BackupEntryFromImmutableFile.h>
# include <Disks/SingleDiskVolume.h>
2022-04-05 19:12:48 +00:00
namespace DB
{
2022-04-07 11:58:38 +00:00
namespace ErrorCodes
{
extern const int DIRECTORY_ALREADY_EXISTS ;
2022-04-12 18:59:49 +00:00
extern const int NOT_ENOUGH_SPACE ;
2022-05-05 09:23:23 +00:00
extern const int LOGICAL_ERROR ;
2022-09-26 14:33:25 +00:00
extern const int FILE_DOESNT_EXIST ;
2023-01-25 17:34:09 +00:00
extern const int CORRUPTED_DATA ;
2022-04-07 11:58:38 +00:00
}
2023-01-25 17:34:09 +00:00
DataPartStorageOnDiskBase : : DataPartStorageOnDiskBase ( VolumePtr volume_ , std : : string root_path_ , std : : string part_dir_ )
2022-04-12 18:59:49 +00:00
: volume ( std : : move ( volume_ ) ) , root_path ( std : : move ( root_path_ ) ) , part_dir ( std : : move ( part_dir_ ) )
2022-05-05 09:19:12 +00:00
{
2022-04-05 19:12:48 +00:00
}
2023-01-25 17:34:09 +00:00
DataPartStorageOnDiskBase : : DataPartStorageOnDiskBase (
2022-10-24 15:08:51 +00:00
VolumePtr volume_ , std : : string root_path_ , std : : string part_dir_ , DiskTransactionPtr transaction_ )
: volume ( std : : move ( volume_ ) )
, root_path ( std : : move ( root_path_ ) )
, part_dir ( std : : move ( part_dir_ ) )
, transaction ( std : : move ( transaction_ ) )
, has_shared_transaction ( transaction ! = nullptr )
{
}
2023-01-25 17:34:09 +00:00
DiskPtr DataPartStorageOnDiskBase : : getDisk ( ) const
2022-04-05 19:12:48 +00:00
{
2023-01-25 17:34:09 +00:00
return volume - > getDisk ( ) ;
2022-04-05 19:12:48 +00:00
}
2023-01-25 17:34:09 +00:00
std : : string DataPartStorageOnDiskBase : : getFullPath ( ) const
2022-04-19 19:34:41 +00:00
{
2023-01-25 17:34:09 +00:00
return fs : : path ( volume - > getDisk ( ) - > getPath ( ) ) / root_path / part_dir / " " ;
2022-04-19 19:34:41 +00:00
}
2023-01-25 17:34:09 +00:00
std : : string DataPartStorageOnDiskBase : : getRelativePath ( ) const
2022-04-19 19:34:41 +00:00
{
2023-01-25 17:34:09 +00:00
return fs : : path ( root_path ) / part_dir / " " ;
2022-04-19 19:34:41 +00:00
}
2023-01-25 17:34:09 +00:00
std : : optional < String > DataPartStorageOnDiskBase : : getRelativePathForPrefix ( Poco : : Logger * log , const String & prefix , bool detached , bool broken ) const
2022-04-22 16:58:09 +00:00
{
2022-10-18 16:13:18 +00:00
assert ( ! broken | | detached ) ;
2022-06-20 18:18:17 +00:00
String res ;
2022-04-22 16:58:09 +00:00
2022-06-20 18:18:17 +00:00
auto full_relative_path = fs : : path ( root_path ) ;
if ( detached )
full_relative_path / = " detached " ;
2022-09-30 18:09:18 +00:00
std : : optional < String > original_checksums_content ;
std : : optional < Strings > original_files_list ;
2022-06-20 18:18:17 +00:00
for ( int try_no = 0 ; try_no < 10 ; + + try_no )
{
2022-10-03 15:56:09 +00:00
if ( prefix . empty ( ) )
res = part_dir + ( try_no ? " _try " + DB : : toString ( try_no ) : " " ) ;
else if ( prefix . ends_with ( " _ " ) )
res = prefix + part_dir + ( try_no ? " _try " + DB : : toString ( try_no ) : " " ) ;
else
res = prefix + " _ " + part_dir + ( try_no ? " _try " + DB : : toString ( try_no ) : " " ) ;
2022-06-20 18:18:17 +00:00
if ( ! volume - > getDisk ( ) - > exists ( full_relative_path / res ) )
return res ;
2023-01-25 17:34:09 +00:00
/// If part with compacted storage is broken then we probably
/// cannot read the single file with data and check its content.
if ( broken
& & isFullPartStorage ( * this )
& & looksLikeBrokenDetachedPartHasTheSameContent ( res , original_checksums_content , original_files_list ) )
2022-09-30 18:09:18 +00:00
{
LOG_WARNING ( log , " Directory {} (to detach to) already exists, "
" but its content looks similar to content of the broken part which we are going to detach. "
" Assuming it was already cloned to detached, will not do it again to avoid redundant copies of broken part. " , res ) ;
return { } ;
}
2022-06-20 18:18:17 +00:00
LOG_WARNING ( log , " Directory {} (to detach to) already exists. Will detach to directory with '_tryN' suffix. " , res ) ;
}
return res ;
2022-04-05 19:12:48 +00:00
}
2023-01-25 17:34:09 +00:00
bool DataPartStorageOnDiskBase : : looksLikeBrokenDetachedPartHasTheSameContent ( const String & detached_part_path ,
2022-09-30 18:09:18 +00:00
std : : optional < String > & original_checksums_content ,
std : : optional < Strings > & original_files_list ) const
{
/// We cannot know for sure that content of detached part is the same,
/// but in most cases it's enough to compare checksums.txt and list of files.
if ( ! exists ( " checksums.txt " ) )
return false ;
2023-01-25 17:34:09 +00:00
auto storage_from_detached = create ( volume , fs : : path ( root_path ) / " detached " , detached_part_path , /*initialize=*/ true ) ;
if ( ! storage_from_detached - > exists ( " checksums.txt " ) )
2022-09-30 18:09:18 +00:00
return false ;
if ( ! original_checksums_content )
{
2023-01-25 17:34:09 +00:00
auto in = storage_from_detached - > readFile ( " checksums.txt " , /* settings */ { } , /* read_hint */ { } , /* file_size */ { } ) ;
2022-09-30 18:09:18 +00:00
original_checksums_content . emplace ( ) ;
readStringUntilEOF ( * original_checksums_content , * in ) ;
}
if ( original_checksums_content - > empty ( ) )
return false ;
String detached_checksums_content ;
{
auto in = readFile ( " checksums.txt " , /* settings */ { } , /* read_hint */ { } , /* file_size */ { } ) ;
readStringUntilEOF ( detached_checksums_content , * in ) ;
}
if ( original_checksums_content ! = detached_checksums_content )
return false ;
if ( ! original_files_list )
{
original_files_list . emplace ( ) ;
2023-01-25 17:34:09 +00:00
for ( auto it = iterate ( ) ; it - > isValid ( ) ; it - > next ( ) )
original_files_list - > emplace_back ( it - > name ( ) ) ;
2022-09-30 18:09:18 +00:00
std : : sort ( original_files_list - > begin ( ) , original_files_list - > end ( ) ) ;
}
Strings detached_files_list ;
2023-01-25 17:34:09 +00:00
for ( auto it = storage_from_detached - > iterate ( ) ; it - > isValid ( ) ; it - > next ( ) )
detached_files_list . emplace_back ( it - > name ( ) ) ;
2022-09-30 18:09:18 +00:00
std : : sort ( detached_files_list . begin ( ) , detached_files_list . end ( ) ) ;
return original_files_list = = detached_files_list ;
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : setRelativePath ( const std : : string & path )
{
part_dir = path ;
}
std : : string DataPartStorageOnDiskBase : : getPartDirectory ( ) const
{
return part_dir ;
}
std : : string DataPartStorageOnDiskBase : : getFullRootPath ( ) const
{
return fs : : path ( volume - > getDisk ( ) - > getPath ( ) ) / root_path / " " ;
}
Poco : : Timestamp DataPartStorageOnDiskBase : : getLastModified ( ) const
{
return volume - > getDisk ( ) - > getLastModified ( fs : : path ( root_path ) / part_dir ) ;
}
static UInt64 calculateTotalSizeOnDiskImpl ( const DiskPtr & disk , const String & from )
{
if ( disk - > isFile ( from ) )
return disk - > getFileSize ( from ) ;
std : : vector < std : : string > files ;
disk - > listFiles ( from , files ) ;
UInt64 res = 0 ;
for ( const auto & file : files )
res + = calculateTotalSizeOnDiskImpl ( disk , fs : : path ( from ) / file ) ;
return res ;
}
UInt64 DataPartStorageOnDiskBase : : calculateTotalSizeOnDisk ( ) const
{
return calculateTotalSizeOnDiskImpl ( volume - > getDisk ( ) , fs : : path ( root_path ) / part_dir ) ;
}
std : : string DataPartStorageOnDiskBase : : getDiskName ( ) const
2022-04-05 19:12:48 +00:00
{
2022-06-20 18:18:17 +00:00
return volume - > getDisk ( ) - > getName ( ) ;
2022-04-05 19:12:48 +00:00
}
2023-01-25 17:34:09 +00:00
std : : string DataPartStorageOnDiskBase : : getDiskType ( ) const
2022-04-05 19:12:48 +00:00
{
2022-08-19 14:58:30 +00:00
return toString ( volume - > getDisk ( ) - > getDataSourceDescription ( ) . type ) ;
2022-04-05 19:12:48 +00:00
}
2023-01-25 17:34:09 +00:00
bool DataPartStorageOnDiskBase : : isStoredOnRemoteDisk ( ) const
2022-04-08 18:56:08 +00:00
{
return volume - > getDisk ( ) - > isRemote ( ) ;
}
2023-01-25 17:34:09 +00:00
bool DataPartStorageOnDiskBase : : supportZeroCopyReplication ( ) const
2022-04-08 18:56:08 +00:00
{
return volume - > getDisk ( ) - > supportZeroCopyReplication ( ) ;
}
2023-01-25 17:34:09 +00:00
bool DataPartStorageOnDiskBase : : supportParallelWrite ( ) const
2022-04-22 16:58:09 +00:00
{
return volume - > getDisk ( ) - > supportParallelWrite ( ) ;
}
2023-01-25 17:34:09 +00:00
bool DataPartStorageOnDiskBase : : isBroken ( ) const
2022-04-19 19:34:41 +00:00
{
return volume - > getDisk ( ) - > isBroken ( ) ;
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : syncRevision ( UInt64 revision ) const
2022-06-20 18:18:17 +00:00
{
volume - > getDisk ( ) - > syncRevision ( revision ) ;
}
2023-01-25 17:34:09 +00:00
UInt64 DataPartStorageOnDiskBase : : getRevision ( ) const
2022-06-20 18:18:17 +00:00
{
return volume - > getDisk ( ) - > getRevision ( ) ;
}
2023-01-25 17:34:09 +00:00
std : : string DataPartStorageOnDiskBase : : getDiskPath ( ) const
2022-04-19 19:34:41 +00:00
{
return volume - > getDisk ( ) - > getPath ( ) ;
}
2023-01-25 17:34:09 +00:00
ReservationPtr DataPartStorageOnDiskBase : : reserve ( UInt64 bytes ) const
2022-06-20 18:18:17 +00:00
{
auto res = volume - > reserve ( bytes ) ;
if ( ! res )
throw Exception ( ErrorCodes : : NOT_ENOUGH_SPACE , " Cannot reserve {}, not enough space " , ReadableSize ( bytes ) ) ;
return res ;
}
2023-01-25 17:34:09 +00:00
ReservationPtr DataPartStorageOnDiskBase : : tryReserve ( UInt64 bytes ) const
{
return volume - > reserve ( bytes ) ;
}
IDataPartStorage : : ReplicatedFilesDescription
DataPartStorageOnDiskBase : : getReplicatedFilesDescription ( const NameSet & file_names ) const
{
ReplicatedFilesDescription description ;
auto relative_path = fs : : path ( root_path ) / part_dir ;
auto disk = volume - > getDisk ( ) ;
auto actual_file_names = getActualFileNamesOnDisk ( file_names ) ;
for ( const auto & name : actual_file_names )
{
auto path = relative_path / name ;
size_t file_size = disk - > getFileSize ( path ) ;
auto & file_desc = description . files [ name ] ;
file_desc . file_size = file_size ;
file_desc . input_buffer_getter = [ disk , path , file_size ]
{
return disk - > readFile ( path , ReadSettings { } . adjustBufferSize ( file_size ) , file_size , file_size ) ;
} ;
}
return description ;
2022-06-20 18:18:17 +00:00
}
2023-01-25 17:34:09 +00:00
IDataPartStorage : : ReplicatedFilesDescription
DataPartStorageOnDiskBase : : getReplicatedFilesDescriptionForRemoteDisk ( const NameSet & file_names ) const
2022-05-05 09:19:12 +00:00
{
2023-01-25 17:34:09 +00:00
ReplicatedFilesDescription description ;
auto relative_path = fs : : path ( root_path ) / part_dir ;
2022-06-21 07:26:43 +00:00
auto disk = volume - > getDisk ( ) ;
if ( ! disk - > supportZeroCopyReplication ( ) )
2023-01-23 21:13:58 +00:00
throw Exception ( ErrorCodes : : LOGICAL_ERROR , " Disk {} doesn't support zero-copy replication " , disk - > getName ( ) ) ;
2022-06-21 07:26:43 +00:00
2023-01-25 17:34:09 +00:00
description . unique_id = getUniqueId ( ) ;
Names paths ;
auto actual_file_names = getActualFileNamesOnDisk ( file_names ) ;
for ( const auto & name : actual_file_names )
{
/// Just some additional checks
auto metadata_full_file_path = fs : : path ( getFullPath ( ) ) / name ;
if ( ! fs : : exists ( metadata_full_file_path ) )
throw Exception ( ErrorCodes : : CORRUPTED_DATA , " Remote metadata '{}' is not exists " , name ) ;
if ( ! fs : : is_regular_file ( metadata_full_file_path ) )
throw Exception ( ErrorCodes : : CORRUPTED_DATA , " Remote metadata '{}' is not a file " , name ) ;
paths . emplace_back ( relative_path / name ) ;
}
auto serialized_metadata = disk - > getSerializedMetadata ( paths ) ;
for ( const auto & name : actual_file_names )
{
auto & file_desc = description . files [ name ] ;
const auto & metadata_str = serialized_metadata . at ( relative_path / name ) ;
file_desc . file_size = metadata_str . size ( ) ;
file_desc . input_buffer_getter = [ metadata_str ]
{
return std : : make_unique < ReadBufferFromString > ( metadata_str ) ;
} ;
}
return description ;
2022-05-05 09:19:12 +00:00
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : backup (
2022-04-19 19:34:41 +00:00
const MergeTreeDataPartChecksums & checksums ,
const NameSet & files_without_checksums ,
2022-06-22 20:30:50 +00:00
const String & path_in_backup ,
2022-09-06 23:58:03 +00:00
BackupEntries & backup_entries ,
bool make_temporary_hard_links ,
TemporaryFilesOnDisks * temp_dirs ) const
2022-04-19 19:34:41 +00:00
{
2022-06-22 20:30:50 +00:00
fs : : path part_path_on_disk = fs : : path { root_path } / part_dir ;
fs : : path part_path_in_backup = fs : : path { path_in_backup } / part_dir ;
2022-04-19 19:34:41 +00:00
2022-06-22 20:30:50 +00:00
auto disk = volume - > getDisk ( ) ;
2022-09-06 23:58:03 +00:00
fs : : path temp_part_dir ;
std : : shared_ptr < TemporaryFileOnDisk > temp_dir_owner ;
if ( make_temporary_hard_links )
{
assert ( temp_dirs ) ;
auto temp_dir_it = temp_dirs - > find ( disk ) ;
if ( temp_dir_it = = temp_dirs - > end ( ) )
temp_dir_it = temp_dirs - > emplace ( disk , std : : make_shared < TemporaryFileOnDisk > ( disk , " tmp/ " ) ) . first ;
2023-01-25 17:34:09 +00:00
2022-09-06 23:58:03 +00:00
temp_dir_owner = temp_dir_it - > second ;
fs : : path temp_dir = temp_dir_owner - > getPath ( ) ;
temp_part_dir = temp_dir / part_path_in_backup . relative_path ( ) ;
disk - > createDirectories ( temp_part_dir ) ;
}
2022-04-19 19:34:41 +00:00
2022-06-22 20:30:50 +00:00
/// For example,
/// part_path_in_backup = /data/test/table/0_1_1_0
/// part_path_on_disk = store/f57/f5728353-44bb-4575-85e8-28deb893657a/0_1_1_0
2022-07-03 14:32:11 +00:00
/// tmp_part_dir = tmp/1aaaaaa/data/test/table/0_1_1_0
2022-06-22 20:30:50 +00:00
/// Or, for projections:
/// part_path_in_backup = /data/test/table/0_1_1_0/prjmax.proj
/// part_path_on_disk = store/f57/f5728353-44bb-4575-85e8-28deb893657a/0_1_1_0/prjmax.proj
2022-07-03 14:32:11 +00:00
/// tmp_part_dir = tmp/1aaaaaa/data/test/table/0_1_1_0/prjmax.proj
2022-06-22 20:30:50 +00:00
2023-01-25 17:34:09 +00:00
auto files_to_backup = files_without_checksums ;
for ( const auto & [ name , _ ] : checksums . files )
{
if ( ! name . ends_with ( " .proj " ) )
files_to_backup . insert ( name ) ;
}
files_to_backup = getActualFileNamesOnDisk ( files_to_backup ) ;
for ( const auto & filepath : files_to_backup )
2022-04-19 19:34:41 +00:00
{
2023-01-25 17:34:09 +00:00
auto filepath_on_disk = part_path_on_disk / filepath ;
auto filepath_in_backup = part_path_in_backup / filepath ;
if ( files_without_checksums . contains ( filepath ) )
{
backup_entries . emplace_back ( filepath_in_backup , std : : make_unique < BackupEntryFromSmallFile > ( disk , filepath_on_disk ) ) ;
continue ;
}
2022-06-30 08:10:12 +00:00
2022-09-06 23:58:03 +00:00
if ( make_temporary_hard_links )
{
String hardlink_filepath = temp_part_dir / filepath ;
disk - > createHardLink ( filepath_on_disk , hardlink_filepath ) ;
filepath_on_disk = hardlink_filepath ;
}
2023-01-25 17:34:09 +00:00
std : : optional < UInt64 > file_size ;
std : : optional < UInt128 > file_hash ;
auto it = checksums . files . find ( filepath ) ;
if ( it ! = checksums . files . end ( ) )
{
file_size = it - > second . file_size ;
file_hash = { it - > second . file_hash . first , it - > second . file_hash . second } ;
}
2022-04-19 19:34:41 +00:00
backup_entries . emplace_back (
2022-06-22 20:30:50 +00:00
filepath_in_backup ,
2023-01-25 17:34:09 +00:00
std : : make_unique < BackupEntryFromImmutableFile > ( disk , filepath_on_disk , file_size , file_hash , temp_dir_owner ) ) ;
2022-04-19 19:34:41 +00:00
}
}
2023-01-25 17:34:09 +00:00
MutableDataPartStoragePtr DataPartStorageOnDiskBase : : freeze (
2022-05-05 09:19:12 +00:00
const std : : string & to ,
2022-04-19 19:34:41 +00:00
const std : : string & dir_path ,
2022-05-03 15:48:05 +00:00
bool make_source_readonly ,
std : : function < void ( const DiskPtr & ) > save_metadata_callback ,
2022-09-27 13:50:25 +00:00
bool copy_instead_of_hardlink ,
const NameSet & files_to_copy_instead_of_hardlinks ) const
2022-04-19 19:34:41 +00:00
{
auto disk = volume - > getDisk ( ) ;
disk - > createDirectories ( to ) ;
2022-09-27 13:50:25 +00:00
localBackup ( disk , getRelativePath ( ) , fs : : path ( to ) / dir_path , make_source_readonly , { } , copy_instead_of_hardlink , files_to_copy_instead_of_hardlinks ) ;
2022-04-19 19:34:41 +00:00
if ( save_metadata_callback )
save_metadata_callback ( disk ) ;
disk - > removeFileIfExists ( fs : : path ( to ) / dir_path / " delete-on-destroy.txt " ) ;
2022-05-03 15:48:05 +00:00
disk - > removeFileIfExists ( fs : : path ( to ) / dir_path / " txn_version.txt " ) ;
2022-04-19 19:34:41 +00:00
auto single_disk_volume = std : : make_shared < SingleDiskVolume > ( disk - > getName ( ) , disk , 0 ) ;
2023-01-25 17:34:09 +00:00
/// Do not initialize storage in case of DETACH because part may be broken.
bool to_detached = dir_path . starts_with ( " detached/ " ) ;
return create ( single_disk_volume , to , dir_path , /*initialize=*/ ! to_detached ) ;
2022-04-19 19:34:41 +00:00
}
2023-01-25 17:34:09 +00:00
MutableDataPartStoragePtr DataPartStorageOnDiskBase : : clonePart (
2022-04-19 19:34:41 +00:00
const std : : string & to ,
const std : : string & dir_path ,
2022-06-15 11:41:08 +00:00
const DiskPtr & disk ,
2022-04-19 19:34:41 +00:00
Poco : : Logger * log ) const
{
String path_to_clone = fs : : path ( to ) / dir_path / " " ;
if ( disk - > exists ( path_to_clone ) )
{
LOG_WARNING ( log , " Path {} already exists. Will remove it and clone again. " , fullPath ( disk , path_to_clone ) ) ;
disk - > removeRecursive ( path_to_clone ) ;
}
2022-10-22 22:51:59 +00:00
2022-04-19 19:34:41 +00:00
disk - > createDirectories ( to ) ;
2022-06-20 18:18:17 +00:00
volume - > getDisk ( ) - > copy ( getRelativePath ( ) , disk , to ) ;
2022-04-19 19:34:41 +00:00
volume - > getDisk ( ) - > removeFileIfExists ( fs : : path ( path_to_clone ) / " delete-on-destroy.txt " ) ;
auto single_disk_volume = std : : make_shared < SingleDiskVolume > ( disk - > getName ( ) , disk , 0 ) ;
2023-01-25 17:34:09 +00:00
return create ( single_disk_volume , to , dir_path , /*initialize=*/ true ) ;
2022-04-19 19:34:41 +00:00
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : rename (
2022-12-22 13:31:42 +00:00
std : : string new_root_path ,
std : : string new_part_dir ,
2022-06-26 16:43:28 +00:00
Poco : : Logger * log ,
bool remove_new_dir_if_exists ,
bool fsync_part_dir )
2022-06-20 18:18:17 +00:00
{
2022-12-22 13:31:42 +00:00
if ( new_root_path . ends_with ( ' / ' ) )
new_root_path . pop_back ( ) ;
if ( new_part_dir . ends_with ( ' / ' ) )
new_part_dir . pop_back ( ) ;
2022-06-20 18:18:17 +00:00
String to = fs : : path ( new_root_path ) / new_part_dir / " " ;
if ( volume - > getDisk ( ) - > exists ( to ) )
{
if ( remove_new_dir_if_exists )
{
Names files ;
volume - > getDisk ( ) - > listFiles ( to , files ) ;
if ( log )
LOG_WARNING ( log ,
" Part directory {} already exists and contains {} files. Removing it. " ,
fullPath ( volume - > getDisk ( ) , to ) , files . size ( ) ) ;
2023-01-25 17:34:09 +00:00
executeWriteOperation ( [ & ] ( auto & disk ) { disk . removeRecursive ( to ) ; } ) ;
2022-06-20 18:18:17 +00:00
}
else
{
throw Exception (
ErrorCodes : : DIRECTORY_ALREADY_EXISTS ,
" Part directory {} already exists " ,
fullPath ( volume - > getDisk ( ) , to ) ) ;
}
}
2023-01-25 17:34:09 +00:00
2022-06-20 18:18:17 +00:00
String from = getRelativePath ( ) ;
/// Why?
2023-01-25 17:34:09 +00:00
executeWriteOperation ( [ & ] ( auto & disk )
2022-10-22 22:51:59 +00:00
{
disk . setLastModified ( from , Poco : : Timestamp : : fromEpochTime ( time ( nullptr ) ) ) ;
disk . moveDirectory ( from , to ) ;
2023-01-24 10:32:01 +00:00
/// Only after moveDirectory() since before the directory does not exists.
SyncGuardPtr to_sync_guard ;
if ( fsync_part_dir )
to_sync_guard = volume - > getDisk ( ) - > getDirectorySyncGuard ( to ) ;
2022-10-22 22:51:59 +00:00
} ) ;
2022-06-20 18:18:17 +00:00
part_dir = new_part_dir ;
root_path = new_root_path ;
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : remove (
CanRemoveCallback & & can_remove_callback ,
const MergeTreeDataPartChecksums & checksums ,
std : : list < ProjectionChecksums > projections ,
bool is_temp ,
Poco : : Logger * log )
{
/// NOTE We rename part to delete_tmp_<relative_path> instead of delete_tmp_<name> to avoid race condition
/// when we try to remove two parts with the same name, but different relative paths,
/// for example all_1_2_1 (in Deleting state) and tmp_merge_all_1_2_1 (in Temporary state).
fs : : path from = fs : : path ( root_path ) / part_dir ;
// TODO directory delete_tmp_<name> is never removed if server crashes before returning from this function
/// Cut last "/" if it exists (it shouldn't). Otherwise fs::path behave differently.
fs : : path part_dir_without_slash = part_dir . ends_with ( " / " ) ? part_dir . substr ( 0 , part_dir . size ( ) - 1 ) : part_dir ;
/// NOTE relative_path can contain not only part name itself, but also some prefix like
/// "moving/all_1_1_1" or "detached/all_2_3_5". We should handle this case more properly.
/// File might be already renamed on previous try
bool has_delete_prefix = part_dir_without_slash . filename ( ) . string ( ) . starts_with ( " delete_tmp_ " ) ;
std : : optional < CanRemoveDescription > can_remove_description ;
auto disk = volume - > getDisk ( ) ;
fs : : path to = fs : : path ( root_path ) / part_dir_without_slash ;
if ( ! has_delete_prefix )
{
if ( part_dir_without_slash . has_parent_path ( ) )
{
auto parent_path = part_dir_without_slash . parent_path ( ) ;
if ( parent_path = = " detached " )
throw Exception (
ErrorCodes : : LOGICAL_ERROR ,
" Trying to remove detached part {} with path {} in remove function. It shouldn't happen " ,
part_dir ,
root_path ) ;
part_dir_without_slash = parent_path / ( " delete_tmp_ " + std : : string { part_dir_without_slash . filename ( ) } ) ;
}
else
{
part_dir_without_slash = ( " delete_tmp_ " + std : : string { part_dir_without_slash . filename ( ) } ) ;
}
to = fs : : path ( root_path ) / part_dir_without_slash ;
if ( disk - > exists ( to ) )
{
LOG_WARNING ( log , " Directory {} (to which part must be renamed before removing) already exists. "
" Most likely this is due to unclean restart or race condition. Removing it. " , fullPath ( disk , to ) ) ;
try
{
can_remove_description . emplace ( can_remove_callback ( ) ) ;
disk - > removeSharedRecursive (
fs : : path ( to ) / " " , ! can_remove_description - > can_remove_anything , can_remove_description - > files_not_to_remove ) ;
}
catch ( . . . )
{
LOG_ERROR (
log , " Cannot recursively remove directory {}. Exception: {} " , fullPath ( disk , to ) , getCurrentExceptionMessage ( false ) ) ;
throw ;
}
}
try
{
disk - > moveDirectory ( from , to ) ;
part_dir = part_dir_without_slash ;
}
catch ( const Exception & e )
{
if ( e . code ( ) = = ErrorCodes : : FILE_DOESNT_EXIST )
{
LOG_ERROR ( log , " Directory {} (part to remove) doesn't exist or one of nested files has gone. Most likely this is due to manual removing. This should be discouraged. Ignoring. " , fullPath ( disk , from ) ) ;
return ;
}
throw ;
}
catch ( const fs : : filesystem_error & e )
{
if ( e . code ( ) = = std : : errc : : no_such_file_or_directory )
{
LOG_ERROR ( log , " Directory {} (part to remove) doesn't exist or one of nested files has gone. "
" Most likely this is due to manual removing. This should be discouraged. Ignoring. " , fullPath ( disk , from ) ) ;
return ;
}
throw ;
}
}
if ( ! can_remove_description )
can_remove_description . emplace ( can_remove_callback ( ) ) ;
// Record existing projection directories so we don't remove them twice
std : : unordered_set < String > projection_directories ;
std : : string proj_suffix = " .proj " ;
for ( const auto & projection : projections )
{
std : : string proj_dir_name = projection . name + proj_suffix ;
projection_directories . emplace ( proj_dir_name ) ;
NameSet files_not_to_remove_for_projection ;
for ( const auto & file_name : can_remove_description - > files_not_to_remove )
if ( file_name . starts_with ( proj_dir_name ) )
files_not_to_remove_for_projection . emplace ( fs : : path ( file_name ) . filename ( ) ) ;
LOG_DEBUG ( log , " Will not remove files [{}] for projection {} " , fmt : : join ( files_not_to_remove_for_projection , " , " ) , projection . name ) ;
CanRemoveDescription proj_description
{
can_remove_description - > can_remove_anything ,
std : : move ( files_not_to_remove_for_projection ) ,
} ;
clearDirectory ( fs : : path ( to ) / proj_dir_name , proj_description , projection . checksums , is_temp , log ) ;
}
/// It is possible that we are removing the part which have a written but not loaded projection.
/// Such a part can appear server was restarted after DROP PROJECTION but before old part was removed.
/// In this case, the old part will load only projections from metadata.
/// See test 01701_clear_projection_and_part.
for ( const auto & [ name , _ ] : checksums . files )
{
if ( endsWith ( name , proj_suffix ) & & ! projection_directories . contains ( name ) )
{
static constexpr auto checksums_name = " checksums.txt " ;
auto projection_storage = create ( volume , to , name , /*initialize=*/ true ) ;
/// If we have a directory with suffix '.proj' it is likely a projection.
/// Try to load checksums for it (to avoid recursive removing fallback).
if ( projection_storage - > exists ( checksums_name ) )
{
try
{
MergeTreeDataPartChecksums tmp_checksums ;
auto in = projection_storage - > readFile ( checksums_name , { } , { } , { } ) ;
tmp_checksums . read ( * in ) ;
clearDirectory ( fs : : path ( to ) / name , * can_remove_description , tmp_checksums , is_temp , log ) ;
}
catch ( . . . )
{
LOG_ERROR ( log , " Cannot load checksums from {} " , fs : : path ( projection_storage - > getRelativePath ( ) ) / checksums_name ) ;
}
}
}
}
clearDirectory ( to , * can_remove_description , checksums , is_temp , log ) ;
}
void DataPartStorageOnDiskBase : : clearDirectory (
const std : : string & dir ,
const CanRemoveDescription & can_remove_description ,
const MergeTreeDataPartChecksums & checksums ,
bool is_temp ,
Poco : : Logger * log )
{
auto disk = volume - > getDisk ( ) ;
auto [ can_remove_shared_data , names_not_to_remove ] = can_remove_description ;
names_not_to_remove = getActualFileNamesOnDisk ( names_not_to_remove ) ;
/// It does not make sense to try fast path for incomplete temporary parts, because some files are probably absent.
/// Sometimes we add something to checksums.files before actually writing checksums and columns on disk.
/// Also sometimes we write checksums.txt and columns.txt in arbitrary order, so this check becomes complex...
bool incomplete_temporary_part = is_temp & & ( ! disk - > exists ( fs : : path ( dir ) / " checksums.txt " ) | | ! disk - > exists ( fs : : path ( dir ) / " columns.txt " ) ) ;
if ( checksums . empty ( ) | | incomplete_temporary_part )
{
/// If the part is not completely written, we cannot use fast path by listing files.
disk - > removeSharedRecursive ( fs : : path ( dir ) / " " , ! can_remove_shared_data , names_not_to_remove ) ;
return ;
}
try
{
NameSet names_to_remove = { " checksums.txt " , " columns.txt " } ;
for ( const auto & [ file , _ ] : checksums . files )
if ( ! endsWith ( file , " .proj " ) )
names_to_remove . emplace ( file ) ;
names_to_remove = getActualFileNamesOnDisk ( names_to_remove ) ;
/// Remove each expected file in directory, then remove directory itself.
RemoveBatchRequest request ;
for ( const auto & file : names_to_remove )
request . emplace_back ( fs : : path ( dir ) / file ) ;
request . emplace_back ( fs : : path ( dir ) / " default_compression_codec.txt " , true ) ;
request . emplace_back ( fs : : path ( dir ) / " delete-on-destroy.txt " , true ) ;
request . emplace_back ( fs : : path ( dir ) / " txn_version.txt " , true ) ;
2023-02-14 12:31:38 +00:00
/// Inverted index
request . emplace_back ( fs : : path ( dir ) / " skp_idx_af.gin_dict " , true ) ;
request . emplace_back ( fs : : path ( dir ) / " skp_idx_af.gin_post " , true ) ;
request . emplace_back ( fs : : path ( dir ) / " skp_idx_af.gin_seg " , true ) ;
request . emplace_back ( fs : : path ( dir ) / " skp_idx_af.gin_sid " , true ) ;
2023-01-25 17:34:09 +00:00
disk - > removeSharedFiles ( request , ! can_remove_shared_data , names_not_to_remove ) ;
disk - > removeDirectory ( dir ) ;
}
catch ( . . . )
{
/// Recursive directory removal does many excessive "stat" syscalls under the hood.
LOG_ERROR ( log , " Cannot quickly remove directory {} by removing files; fallback to recursive removal. Reason: {} " , fullPath ( disk , dir ) , getCurrentExceptionMessage ( false ) ) ;
disk - > removeSharedRecursive ( fs : : path ( dir ) / " " , ! can_remove_shared_data , names_not_to_remove ) ;
}
}
void DataPartStorageOnDiskBase : : changeRootPath ( const std : : string & from_root , const std : : string & to_root )
2022-06-20 18:18:17 +00:00
{
/// This is a very dumb implementation, here for root path like
/// "some/current/path/to/part" and change like
/// "some/current" -> "other/different", we just replace prefix to make new root like
/// "other/different/path/to/part".
/// Here we expect that actual move was done by somebody else.
size_t prefix_size = from_root . size ( ) ;
if ( prefix_size > 0 & & from_root . back ( ) = = ' / ' )
- - prefix_size ;
if ( prefix_size > root_path . size ( )
2022-10-24 22:38:53 +00:00
| | std : : string_view ( from_root ) . substr ( 0 , prefix_size ) ! = std : : string_view ( root_path ) . substr ( 0 , prefix_size ) )
2022-06-20 18:18:17 +00:00
throw Exception (
ErrorCodes : : LOGICAL_ERROR ,
" Cannot change part root to {} because it is not a prefix of current root {} " ,
from_root , root_path ) ;
size_t dst_size = to_root . size ( ) ;
if ( dst_size > 0 & & to_root . back ( ) = = ' / ' )
- - dst_size ;
root_path = to_root . substr ( 0 , dst_size ) + root_path . substr ( prefix_size ) ;
}
2022-04-19 19:34:41 +00:00
2023-01-25 17:34:09 +00:00
SyncGuardPtr DataPartStorageOnDiskBase : : getDirectorySyncGuard ( ) const
2022-05-05 09:19:12 +00:00
{
2022-10-22 22:51:59 +00:00
return volume - > getDisk ( ) - > getDirectorySyncGuard ( fs : : path ( root_path ) / part_dir ) ;
2022-04-12 18:59:49 +00:00
}
2023-01-25 17:34:09 +00:00
std : : unique_ptr < WriteBufferFromFileBase > DataPartStorageOnDiskBase : : writeTransactionFile ( WriteMode mode ) const
2022-10-23 22:29:24 +00:00
{
return volume - > getDisk ( ) - > writeFile ( fs : : path ( root_path ) / part_dir / " txn_version.txt " , 256 , mode ) ;
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : removeRecursive ( )
2022-04-12 18:59:49 +00:00
{
2023-01-25 17:34:09 +00:00
executeWriteOperation ( [ & ] ( auto & disk ) { disk . removeRecursive ( fs : : path ( root_path ) / part_dir ) ; } ) ;
2022-04-12 18:59:49 +00:00
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : removeSharedRecursive ( bool keep_in_remote_fs )
2022-04-21 19:19:13 +00:00
{
2023-01-25 17:34:09 +00:00
executeWriteOperation ( [ & ] ( auto & disk ) { disk . removeSharedRecursive ( fs : : path ( root_path ) / part_dir , keep_in_remote_fs , { } ) ; } ) ;
2022-04-21 19:19:13 +00:00
}
2023-01-25 17:34:09 +00:00
void DataPartStorageOnDiskBase : : createDirectories ( )
2022-04-12 18:59:49 +00:00
{
2023-01-25 17:34:09 +00:00
executeWriteOperation ( [ & ] ( auto & disk ) { disk . createDirectories ( fs : : path ( root_path ) / part_dir ) ; } ) ;
2022-04-12 18:59:49 +00:00
}
2023-01-25 17:34:09 +00:00
bool DataPartStorageOnDiskBase : : hasActiveTransaction ( ) const
2022-04-12 18:59:49 +00:00
{
2023-01-25 17:34:09 +00:00
return transaction ! = nullptr ;
2022-06-23 16:21:46 +00:00
}
2022-04-05 19:12:48 +00:00
}