2022-08-12 09:32:13 +00:00
|
|
|
#include <Storages/MergeTree/ReplicatedMergeTreeAttachThread.h>
|
|
|
|
#include <Storages/StorageReplicatedMergeTree.h>
|
2022-08-19 08:17:02 +00:00
|
|
|
#include "Common/ZooKeeper/IKeeper.h"
|
2022-08-12 09:32:13 +00:00
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2022-08-12 11:56:46 +00:00
|
|
|
namespace ErrorCodes
|
|
|
|
{
|
|
|
|
extern const int ABORTED;
|
|
|
|
}
|
|
|
|
|
2022-08-12 09:32:13 +00:00
|
|
|
ReplicatedMergeTreeAttachThread::ReplicatedMergeTreeAttachThread(StorageReplicatedMergeTree & storage_)
|
|
|
|
: storage(storage_)
|
|
|
|
, log_name(storage.getStorageID().getFullTableName() + " (ReplicatedMergeTreeAttachThread)")
|
|
|
|
, log(&Poco::Logger::get(log_name))
|
|
|
|
{
|
|
|
|
task = storage.getContext()->getSchedulePool().createTask(log_name, [this] { run(); });
|
2022-08-16 11:20:58 +00:00
|
|
|
const auto storage_settings = storage.getSettings();
|
|
|
|
retry_period = storage_settings->initialization_retry_period.totalSeconds();
|
2022-08-12 09:32:13 +00:00
|
|
|
}
|
|
|
|
|
2022-08-17 08:28:53 +00:00
|
|
|
ReplicatedMergeTreeAttachThread::~ReplicatedMergeTreeAttachThread()
|
|
|
|
{
|
|
|
|
shutdown();
|
|
|
|
}
|
|
|
|
|
2022-08-12 09:32:13 +00:00
|
|
|
void ReplicatedMergeTreeAttachThread::shutdown()
|
|
|
|
{
|
2022-08-17 08:28:53 +00:00
|
|
|
if (!shutdown_called.exchange(true))
|
|
|
|
task->deactivate();
|
2022-08-12 09:32:13 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ReplicatedMergeTreeAttachThread::run()
|
|
|
|
{
|
2022-08-19 08:17:02 +00:00
|
|
|
bool needs_retry{false};
|
2022-08-12 09:32:13 +00:00
|
|
|
try
|
|
|
|
{
|
2022-08-19 08:17:02 +00:00
|
|
|
runImpl();
|
|
|
|
finalizeInitialization();
|
|
|
|
}
|
|
|
|
catch (const Exception & e)
|
|
|
|
{
|
|
|
|
if (const auto * coordination_exception = dynamic_cast<const Coordination::Exception *>(&e))
|
2022-08-17 08:28:53 +00:00
|
|
|
{
|
2022-08-19 08:17:02 +00:00
|
|
|
std::array retriable_errors{
|
|
|
|
Coordination::Error::ZCONNECTIONLOSS, Coordination::Error::ZSESSIONEXPIRED, Coordination::Error::ZOPERATIONTIMEOUT};
|
|
|
|
needs_retry = std::any_of(
|
|
|
|
retriable_errors.begin(), retriable_errors.end(), [&](const auto error) { return error == coordination_exception->code; });
|
2022-08-17 08:28:53 +00:00
|
|
|
}
|
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
if (!needs_retry)
|
2022-08-17 08:28:53 +00:00
|
|
|
{
|
2022-08-19 08:17:02 +00:00
|
|
|
LOG_ERROR(log, "Initialization failed, table will remain readonly. Error: {}", e.message());
|
|
|
|
{
|
|
|
|
std::lock_guard lock(storage.initialization_mutex);
|
|
|
|
storage.init_phase = StorageReplicatedMergeTree::InitializationPhase::INITIALIZATION_DONE;
|
|
|
|
}
|
2022-08-17 08:28:53 +00:00
|
|
|
}
|
2022-08-19 08:17:02 +00:00
|
|
|
}
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
if (!first_try_done.exchange(true))
|
|
|
|
first_try_done.notify_one();
|
2022-08-16 08:19:02 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
if (shutdown_called)
|
|
|
|
{
|
|
|
|
LOG_WARNING(log, "Shutdown called, cancelling initialization");
|
|
|
|
return;
|
|
|
|
}
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
if (needs_retry)
|
|
|
|
task->scheduleAfter(retry_period * 1000);
|
|
|
|
}
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
void ReplicatedMergeTreeAttachThread::runImpl()
|
|
|
|
{
|
|
|
|
LOG_INFO(log, "Table will be in readonly mode until initialization is finished");
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
if (first_try_done || !zookeeper)
|
|
|
|
storage.setZooKeeper();
|
2022-08-16 08:19:02 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
const auto & zookeeper_path = storage.zookeeper_path;
|
|
|
|
bool metadata_exists = zookeeper->exists(zookeeper_path + "/metadata");
|
|
|
|
if (!metadata_exists)
|
|
|
|
{
|
|
|
|
LOG_WARNING(log, "No metadata in ZooKeeper for {}: table will stay in readonly mode.", zookeeper_path);
|
|
|
|
storage.has_metadata_in_zookeeper = false;
|
|
|
|
finalizeInitialization();
|
|
|
|
return;
|
|
|
|
}
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
auto metadata_snapshot = storage.getInMemoryMetadataPtr();
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
const auto & replica_path = storage.replica_path;
|
|
|
|
/// May it be ZK lost not the whole root, so the upper check passed, but only the /replicas/replica
|
|
|
|
/// folder.
|
|
|
|
bool replica_path_exists = zookeeper->exists(replica_path);
|
|
|
|
if (!replica_path_exists)
|
|
|
|
{
|
|
|
|
LOG_WARNING(log, "No metadata in ZooKeeper for {}: table will stay in readonly mode", replica_path);
|
|
|
|
storage.has_metadata_in_zookeeper = false;
|
|
|
|
return;
|
|
|
|
}
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
storage.has_metadata_in_zookeeper = true;
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
/// In old tables this node may missing or be empty
|
|
|
|
String replica_metadata;
|
|
|
|
const bool replica_metadata_exists = zookeeper->tryGet(replica_path + "/metadata", replica_metadata);
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
if (!replica_metadata_exists || replica_metadata.empty())
|
|
|
|
{
|
|
|
|
/// We have to check shared node granularity before we create ours.
|
|
|
|
storage.other_replicas_fixed_granularity = storage.checkFixedGranularityInZookeeper(zookeeper);
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
ReplicatedMergeTreeTableMetadata current_metadata(storage, metadata_snapshot);
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
zookeeper->createOrUpdate(replica_path + "/metadata", current_metadata.toString(), zkutil::CreateMode::Persistent);
|
2022-08-12 09:32:13 +00:00
|
|
|
}
|
2022-08-19 08:17:02 +00:00
|
|
|
|
|
|
|
storage.checkTableStructure(zookeeper, replica_path, metadata_snapshot);
|
|
|
|
storage.checkParts(zookeeper, skip_sanity_checks);
|
|
|
|
|
|
|
|
if (zookeeper->exists(replica_path + "/metadata_version"))
|
2022-08-12 09:32:13 +00:00
|
|
|
{
|
2022-08-19 08:17:02 +00:00
|
|
|
storage.metadata_version = parse<int>(zookeeper->get(replica_path + "/metadata_version"));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
/// This replica was created with old clickhouse version, so we have
|
|
|
|
/// to take version of global node. If somebody will alter our
|
|
|
|
/// table, then we will fill /metadata_version node in zookeeper.
|
|
|
|
/// Otherwise on the next restart we can again use version from
|
|
|
|
/// shared metadata node because it was not changed.
|
|
|
|
Coordination::Stat metadata_stat;
|
|
|
|
zookeeper->get(zookeeper_path + "/metadata", &metadata_stat);
|
|
|
|
storage.metadata_version = metadata_stat.version;
|
|
|
|
}
|
2022-08-12 09:32:13 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
/// Temporary directories contain uninitialized results of Merges or Fetches (after forced restart),
|
|
|
|
/// don't allow to reinitialize them, delete each of them immediately.
|
|
|
|
storage.clearOldTemporaryDirectories(0, {"tmp_", "delete_tmp_", "tmp-fetch_"});
|
|
|
|
storage.clearOldWriteAheadLogs();
|
|
|
|
if (storage.getSettings()->merge_tree_enable_clear_old_broken_detached)
|
|
|
|
storage.clearOldBrokenPartsFromDetachedDirecory();
|
2022-08-17 08:28:53 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
storage.createNewZooKeeperNodes(zookeeper);
|
|
|
|
storage.syncPinnedPartUUIDs(zookeeper);
|
2022-08-17 08:28:53 +00:00
|
|
|
|
2022-08-19 08:17:02 +00:00
|
|
|
storage.createTableSharedID(zookeeper);
|
2022-08-12 09:32:13 +00:00
|
|
|
};
|
|
|
|
|
2022-08-16 08:19:02 +00:00
|
|
|
void ReplicatedMergeTreeAttachThread::finalizeInitialization()
|
|
|
|
{
|
|
|
|
LOG_INFO(log, "Table is initialized");
|
|
|
|
using enum StorageReplicatedMergeTree::InitializationPhase;
|
|
|
|
{
|
|
|
|
std::lock_guard lock(storage.initialization_mutex);
|
|
|
|
if (!storage.startup_called)
|
|
|
|
{
|
|
|
|
storage.init_phase = INITIALIZATION_DONE;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
storage.init_phase = STARTUP_IN_PROGRESS;
|
|
|
|
}
|
|
|
|
|
|
|
|
storage.startupImpl(std::move(zookeeper));
|
|
|
|
}
|
|
|
|
|
2022-08-12 09:32:13 +00:00
|
|
|
void ReplicatedMergeTreeAttachThread::setSkipSanityChecks(bool skip_sanity_checks_)
|
|
|
|
{
|
|
|
|
skip_sanity_checks = skip_sanity_checks_;
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|