2020-11-03 13:47:26 +00:00
|
|
|
#pragma once
|
2021-04-10 23:33:54 +00:00
|
|
|
|
2020-11-03 13:47:26 +00:00
|
|
|
#include <Core/Types.h>
#include <Interpreters/Cluster.h>
#include <Common/ZooKeeper/Types.h>
#include <filesystem>
#include <utility>
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2020-11-27 14:04:03 +00:00
|
|
|
/// Forward declaration only: this header refers to Poco::Logger through pointers.
namespace Poco { class Logger; }
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2021-01-18 14:09:39 +00:00
|
|
|
/// Forward declaration only: this header refers to zkutil::ZooKeeper through std::shared_ptr.
namespace zkutil { class ZooKeeper; }
|
|
|
|
|
2021-05-09 11:59:49 +00:00
|
|
|
/// Shorthand for std::filesystem; fs::path is used in this header to compose node paths.
namespace fs = std::filesystem;
|
|
|
|
|
2020-11-03 13:47:26 +00:00
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2021-07-02 16:39:55 +00:00
|
|
|
/// Error codes referenced by inline code in this header; the constants are defined elsewhere.
namespace ErrorCodes
{
    extern const int LOGICAL_ERROR;
}
|
|
|
|
|
2020-11-03 13:47:26 +00:00
|
|
|
class ASTQueryWithOnCluster;
|
2020-11-20 16:06:27 +00:00
|
|
|
using ZooKeeperPtr = std::shared_ptr<zkutil::ZooKeeper>;
|
2021-03-09 17:05:24 +00:00
|
|
|
using ClusterPtr = std::shared_ptr<Cluster>;
|
2020-11-27 14:04:03 +00:00
|
|
|
class DatabaseReplicated;
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2021-02-19 23:41:58 +00:00
|
|
|
class ZooKeeperMetadataTransaction;
|
|
|
|
using ZooKeeperMetadataTransactionPtr = std::shared_ptr<ZooKeeperMetadataTransaction>;
|
2020-12-04 20:12:32 +00:00
|
|
|
|
2020-11-03 13:47:26 +00:00
|
|
|
struct HostID
|
|
|
|
{
|
|
|
|
String host_name;
|
|
|
|
UInt16 port;
|
|
|
|
|
|
|
|
HostID() = default;
|
|
|
|
|
|
|
|
explicit HostID(const Cluster::Address & address)
|
|
|
|
: host_name(address.host_name), port(address.port) {}
|
|
|
|
|
|
|
|
static HostID fromString(const String & host_port_str);
|
|
|
|
|
|
|
|
String toString() const
|
|
|
|
{
|
|
|
|
return Cluster::Address::toString(host_name, port);
|
|
|
|
}
|
|
|
|
|
|
|
|
String readableString() const
|
|
|
|
{
|
|
|
|
return host_name + ":" + DB::toString(port);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool isLocalAddress(UInt16 clickhouse_port) const;
|
|
|
|
|
|
|
|
static String applyToString(const HostID & host_id)
|
|
|
|
{
|
|
|
|
return host_id.toString();
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
struct DDLLogEntry
|
|
|
|
{
|
2021-03-08 22:57:53 +00:00
|
|
|
UInt64 version = 1;
|
2020-11-03 13:47:26 +00:00
|
|
|
String query;
|
|
|
|
std::vector<HostID> hosts;
|
|
|
|
String initiator; // optional
|
2021-03-08 22:57:53 +00:00
|
|
|
std::optional<SettingsChanges> settings;
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2021-04-10 23:33:54 +00:00
|
|
|
void setSettingsIfRequired(ContextPtr context);
|
2020-11-03 13:47:26 +00:00
|
|
|
String toString() const;
|
|
|
|
void parse(const String & data);
|
2021-03-08 22:57:53 +00:00
|
|
|
void assertVersion() const;
|
2020-11-03 13:47:26 +00:00
|
|
|
};
|
|
|
|
|
2020-11-27 14:04:03 +00:00
|
|
|
struct DDLTaskBase
|
|
|
|
{
|
|
|
|
const String entry_name;
|
|
|
|
const String entry_path;
|
|
|
|
|
|
|
|
DDLLogEntry entry;
|
|
|
|
|
|
|
|
String host_id_str;
|
|
|
|
ASTPtr query;
|
|
|
|
|
2021-02-01 19:29:47 +00:00
|
|
|
bool is_initial_query = false;
|
2020-11-27 14:04:03 +00:00
|
|
|
bool is_circular_replicated = false;
|
|
|
|
bool execute_on_leader = false;
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2020-12-04 20:12:32 +00:00
|
|
|
Coordination::Requests ops;
|
2020-11-27 14:04:03 +00:00
|
|
|
ExecutionStatus execution_status;
|
|
|
|
bool was_executed = false;
|
|
|
|
|
2021-01-26 17:51:25 +00:00
|
|
|
std::atomic_bool completely_processed = false;
|
|
|
|
|
2020-11-29 11:45:32 +00:00
|
|
|
DDLTaskBase(const String & name, const String & path) : entry_name(name), entry_path(path) {}
|
2020-12-03 18:14:27 +00:00
|
|
|
DDLTaskBase(const DDLTaskBase &) = delete;
|
2020-11-29 11:45:32 +00:00
|
|
|
virtual ~DDLTaskBase() = default;
|
|
|
|
|
2021-04-10 23:33:54 +00:00
|
|
|
virtual void parseQueryFromEntry(ContextPtr context);
|
2020-11-29 11:45:32 +00:00
|
|
|
|
2020-11-27 14:04:03 +00:00
|
|
|
virtual String getShardID() const = 0;
|
|
|
|
|
2021-05-31 14:49:02 +00:00
|
|
|
virtual ContextMutablePtr makeQueryContext(ContextPtr from_context, const ZooKeeperPtr & zookeeper);
|
2022-05-06 16:37:20 +00:00
|
|
|
virtual Coordination::RequestPtr getOpToUpdateLogPointer() { return nullptr; }
|
2020-11-27 14:04:03 +00:00
|
|
|
|
2021-05-09 11:59:49 +00:00
|
|
|
inline String getActiveNodePath() const { return fs::path(entry_path) / "active" / host_id_str; }
|
|
|
|
inline String getFinishedNodePath() const { return fs::path(entry_path) / "finished" / host_id_str; }
|
|
|
|
inline String getShardNodePath() const { return fs::path(entry_path) / "shards" / getShardID(); }
|
2020-11-27 14:04:03 +00:00
|
|
|
|
2021-02-09 15:14:20 +00:00
|
|
|
static String getLogEntryName(UInt32 log_entry_number);
|
|
|
|
static UInt32 getLogEntryNumber(const String & log_entry_name);
|
2020-11-27 14:04:03 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
struct DDLTask : public DDLTaskBase
|
2020-11-03 13:47:26 +00:00
|
|
|
{
|
2020-11-27 14:04:03 +00:00
|
|
|
DDLTask(const String & name, const String & path) : DDLTaskBase(name, path) {}
|
|
|
|
|
2021-04-10 23:33:54 +00:00
|
|
|
bool findCurrentHostID(ContextPtr global_context, Poco::Logger * log);
|
2020-11-27 14:04:03 +00:00
|
|
|
|
2021-04-10 23:33:54 +00:00
|
|
|
void setClusterInfo(ContextPtr context, Poco::Logger * log);
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2020-11-27 14:04:03 +00:00
|
|
|
String getShardID() const override;
|
|
|
|
|
|
|
|
private:
|
|
|
|
bool tryFindHostInCluster();
|
2021-04-10 23:33:54 +00:00
|
|
|
bool tryFindHostInClusterViaResolving(ContextPtr context);
|
2020-11-27 14:04:03 +00:00
|
|
|
|
|
|
|
HostID host_id;
|
2020-11-03 13:47:26 +00:00
|
|
|
String cluster_name;
|
|
|
|
ClusterPtr cluster;
|
|
|
|
Cluster::Address address_in_cluster;
|
2021-05-08 15:20:40 +00:00
|
|
|
size_t host_shard_num = 0;
|
|
|
|
size_t host_replica_num = 0;
|
2020-11-27 14:04:03 +00:00
|
|
|
};
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2020-11-27 14:04:03 +00:00
|
|
|
struct DatabaseReplicatedTask : public DDLTaskBase
|
|
|
|
{
|
|
|
|
DatabaseReplicatedTask(const String & name, const String & path, DatabaseReplicated * database_);
|
2020-11-03 13:47:26 +00:00
|
|
|
|
2020-11-27 14:04:03 +00:00
|
|
|
String getShardID() const override;
|
2021-04-10 23:33:54 +00:00
|
|
|
void parseQueryFromEntry(ContextPtr context) override;
|
2021-05-31 14:49:02 +00:00
|
|
|
ContextMutablePtr makeQueryContext(ContextPtr from_context, const ZooKeeperPtr & zookeeper) override;
|
2022-05-06 16:37:20 +00:00
|
|
|
Coordination::RequestPtr getOpToUpdateLogPointer() override;
|
2020-11-20 16:06:27 +00:00
|
|
|
|
2020-11-27 14:04:03 +00:00
|
|
|
DatabaseReplicated * database;
|
2020-11-03 13:47:26 +00:00
|
|
|
};
|
|
|
|
|
2021-02-19 23:41:58 +00:00
|
|
|
/// The main purpose of ZooKeeperMetadataTransaction is to execute all zookeeper operation related to query
|
|
|
|
/// in a single transaction when we performed all required checks and ready to "commit" changes.
|
|
|
|
/// For example, create ALTER_METADATA entry in ReplicatedMergeTree log,
|
|
|
|
/// create path/to/entry/finished/host_id node in distributed DDL queue to mark query as executed and
|
|
|
|
/// update metadata in path/to/replicated_database/metadata/table_name
|
|
|
|
/// It's used for DatabaseReplicated.
|
|
|
|
/// TODO we can also use it for ordinary ON CLUSTER queries
|
|
|
|
class ZooKeeperMetadataTransaction
|
2020-11-20 16:06:27 +00:00
|
|
|
{
|
2020-12-04 20:12:32 +00:00
|
|
|
enum State
|
|
|
|
{
|
|
|
|
CREATED,
|
2021-02-08 19:36:17 +00:00
|
|
|
COMMITTED,
|
2020-12-04 20:12:32 +00:00
|
|
|
FAILED
|
|
|
|
};
|
|
|
|
|
|
|
|
State state = CREATED;
|
2020-11-20 16:06:27 +00:00
|
|
|
ZooKeeperPtr current_zookeeper;
|
|
|
|
String zookeeper_path;
|
2020-11-29 11:45:32 +00:00
|
|
|
bool is_initial_query;
|
2021-07-06 10:26:03 +00:00
|
|
|
String task_path;
|
2020-11-20 16:06:27 +00:00
|
|
|
Coordination::Requests ops;
|
|
|
|
|
2021-02-19 23:41:58 +00:00
|
|
|
public:
|
2021-07-06 10:26:03 +00:00
|
|
|
ZooKeeperMetadataTransaction(const ZooKeeperPtr & current_zookeeper_, const String & zookeeper_path_, bool is_initial_query_, const String & task_path_)
|
2021-02-19 23:41:58 +00:00
|
|
|
: current_zookeeper(current_zookeeper_)
|
|
|
|
, zookeeper_path(zookeeper_path_)
|
|
|
|
, is_initial_query(is_initial_query_)
|
2021-07-06 10:26:03 +00:00
|
|
|
, task_path(task_path_)
|
2021-02-19 23:41:58 +00:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
bool isInitialQuery() const { return is_initial_query; }
|
|
|
|
|
|
|
|
bool isExecuted() const { return state != CREATED; }
|
|
|
|
|
|
|
|
String getDatabaseZooKeeperPath() const { return zookeeper_path; }
|
|
|
|
|
2021-07-06 10:26:03 +00:00
|
|
|
String getTaskZooKeeperPath() const { return task_path; }
|
|
|
|
|
2021-07-02 16:39:55 +00:00
|
|
|
ZooKeeperPtr getZooKeeper() const { return current_zookeeper; }
|
|
|
|
|
2021-02-19 23:41:58 +00:00
|
|
|
void addOp(Coordination::RequestPtr && op)
|
|
|
|
{
|
2021-07-02 16:39:55 +00:00
|
|
|
if (isExecuted())
|
|
|
|
throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot add ZooKeeper operation because query is executed. It's a bug.");
|
2021-02-19 23:41:58 +00:00
|
|
|
ops.emplace_back(op);
|
|
|
|
}
|
|
|
|
|
2021-02-08 19:36:17 +00:00
|
|
|
void moveOpsTo(Coordination::Requests & other_ops)
|
2020-11-20 16:06:27 +00:00
|
|
|
{
|
2021-07-02 16:39:55 +00:00
|
|
|
if (isExecuted())
|
|
|
|
throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot add ZooKeeper operation because query is executed. It's a bug.");
|
2020-11-20 16:06:27 +00:00
|
|
|
std::move(ops.begin(), ops.end(), std::back_inserter(other_ops));
|
2021-01-28 19:02:39 +00:00
|
|
|
ops.clear();
|
2021-02-08 19:36:17 +00:00
|
|
|
state = COMMITTED;
|
2020-11-20 16:06:27 +00:00
|
|
|
}
|
2020-11-29 11:45:32 +00:00
|
|
|
|
|
|
|
void commit();
|
2020-12-04 20:12:32 +00:00
|
|
|
|
2021-07-30 16:34:18 +00:00
|
|
|
~ZooKeeperMetadataTransaction() { assert(isExecuted() || std::uncaught_exceptions() || ops.empty()); }
|
2020-11-20 16:06:27 +00:00
|
|
|
};
|
|
|
|
|
2021-03-09 17:05:24 +00:00
|
|
|
/// Declared here, defined elsewhere.
/// NOTE(review): the "try" prefix suggests a null ClusterPtr may be returned when nothing matches cluster_name - confirm against the definition.
ClusterPtr tryGetReplicatedDatabaseCluster(const String & cluster_name);
|
|
|
|
|
2020-11-03 13:47:26 +00:00
|
|
|
}
|