mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-13 09:52:38 +00:00
157 lines
5.8 KiB
C++
157 lines
5.8 KiB
C++
#pragma once
|
|
|
|
#include <Coordination/CoordinationSettings.h>
|
|
#include <Coordination/KeeperSnapshotManager.h>
|
|
#include <Coordination/KeeperSnapshotManagerS3.h>
|
|
#include <Coordination/KeeperContext.h>
|
|
#include <Coordination/KeeperStorage.h>
|
|
|
|
#include <libnuraft/nuraft.hxx>
|
|
#include <Common/ConcurrentBoundedQueue.h>
|
|
#include <Common/logger_useful.h>
|
|
|
|
|
|
namespace DB
|
|
{
|
|
|
|
using ResponsesQueue = ConcurrentBoundedQueue<KeeperStorage::ResponseForSession>;
|
|
using SnapshotsQueue = ConcurrentBoundedQueue<CreateSnapshotTask>;
|
|
|
|
/// ClickHouse Keeper state machine. Wrapper for KeeperStorage.
|
|
/// Responsible for entries commit, snapshots creation and so on.
|
|
class KeeperStateMachine : public nuraft::state_machine
|
|
{
|
|
public:
|
|
KeeperStateMachine(
|
|
ResponsesQueue & responses_queue_,
|
|
SnapshotsQueue & snapshots_queue_,
|
|
const std::string & snapshots_path_,
|
|
const CoordinationSettingsPtr & coordination_settings_,
|
|
const KeeperContextPtr & keeper_context_,
|
|
KeeperSnapshotManagerS3 * snapshot_manager_s3_,
|
|
const std::string & superdigest_ = "");
|
|
|
|
/// Read state from the latest snapshot
|
|
void init();
|
|
|
|
static KeeperStorage::RequestForSession parseRequest(nuraft::buffer & data);
|
|
|
|
bool preprocess(const KeeperStorage::RequestForSession & request_for_session);
|
|
|
|
nuraft::ptr<nuraft::buffer> pre_commit(uint64_t log_idx, nuraft::buffer & data) override;
|
|
|
|
nuraft::ptr<nuraft::buffer> commit(const uint64_t log_idx, nuraft::buffer & data) override; /// NOLINT
|
|
|
|
/// Save new cluster config to our snapshot (copy of the config stored in StateManager)
|
|
void commit_config(const uint64_t log_idx, nuraft::ptr<nuraft::cluster_config> & new_conf) override; /// NOLINT
|
|
|
|
void rollback(uint64_t log_idx, nuraft::buffer & data) override;
|
|
|
|
// allow_missing - whether the transaction we want to rollback can be missing from storage
|
|
// (can happen in case of exception during preprocessing)
|
|
void rollbackRequest(const KeeperStorage::RequestForSession & request_for_session, bool allow_missing);
|
|
|
|
uint64_t last_commit_index() override { return last_committed_idx; }
|
|
|
|
/// Apply preliminarily saved (save_logical_snp_obj) snapshot to our state.
|
|
bool apply_snapshot(nuraft::snapshot & s) override;
|
|
|
|
nuraft::ptr<nuraft::snapshot> last_snapshot() override;
|
|
|
|
/// Create new snapshot from current state.
|
|
void create_snapshot(nuraft::snapshot & s, nuraft::async_result<bool>::handler_type & when_done) override;
|
|
|
|
/// Save snapshot which was send by leader to us. After that we will apply it in apply_snapshot.
|
|
void save_logical_snp_obj(nuraft::snapshot & s, uint64_t & obj_id, nuraft::buffer & data, bool is_first_obj, bool is_last_obj) override;
|
|
|
|
/// Better name is `serialize snapshot` -- save existing snapshot (created by create_snapshot) into
|
|
/// in-memory buffer data_out.
|
|
int read_logical_snp_obj(
|
|
nuraft::snapshot & s, void *& user_snp_ctx, uint64_t obj_id, nuraft::ptr<nuraft::buffer> & data_out, bool & is_last_obj) override;
|
|
|
|
/// just for test
|
|
KeeperStorage & getStorage() { return *storage; }
|
|
|
|
void shutdownStorage();
|
|
|
|
ClusterConfigPtr getClusterConfig() const;
|
|
|
|
/// Process local read request
|
|
void processReadRequest(const KeeperStorage::RequestForSession & request_for_session);
|
|
|
|
std::vector<int64_t> getDeadSessions();
|
|
|
|
int64_t getNextZxid() const;
|
|
|
|
KeeperStorage::Digest getNodesDigest() const;
|
|
|
|
/// Introspection functions for 4lw commands
|
|
uint64_t getLastProcessedZxid() const;
|
|
|
|
uint64_t getNodesCount() const;
|
|
uint64_t getTotalWatchesCount() const;
|
|
uint64_t getWatchedPathsCount() const;
|
|
uint64_t getSessionsWithWatchesCount() const;
|
|
|
|
void dumpWatches(WriteBufferFromOwnString & buf) const;
|
|
void dumpWatchesByPath(WriteBufferFromOwnString & buf) const;
|
|
void dumpSessionsAndEphemerals(WriteBufferFromOwnString & buf) const;
|
|
|
|
uint64_t getSessionWithEphemeralNodesCount() const;
|
|
uint64_t getTotalEphemeralNodesCount() const;
|
|
uint64_t getApproximateDataSize() const;
|
|
uint64_t getKeyArenaSize() const;
|
|
uint64_t getLatestSnapshotBufSize() const;
|
|
|
|
private:
|
|
/// In our state machine we always have a single snapshot which is stored
|
|
/// in memory in compressed (serialized) format.
|
|
SnapshotMetadataPtr latest_snapshot_meta = nullptr;
|
|
std::string latest_snapshot_path;
|
|
nuraft::ptr<nuraft::buffer> latest_snapshot_buf = nullptr;
|
|
|
|
CoordinationSettingsPtr coordination_settings;
|
|
|
|
/// Main state machine logic
|
|
KeeperStoragePtr storage;
|
|
|
|
/// Save/Load and Serialize/Deserialize logic for snapshots.
|
|
KeeperSnapshotManager snapshot_manager;
|
|
|
|
/// Put processed responses into this queue
|
|
ResponsesQueue & responses_queue;
|
|
|
|
/// Snapshots to create by snapshot thread
|
|
SnapshotsQueue & snapshots_queue;
|
|
|
|
/// Mutex for snapshots
|
|
mutable std::mutex snapshots_lock;
|
|
|
|
/// Lock for storage and responses_queue. It's important to process requests
|
|
/// and push them to the responses queue while holding this lock. Otherwise
|
|
/// we can get strange cases when, for example client send read request with
|
|
/// watch and after that receive watch response and only receive response
|
|
/// for request.
|
|
mutable std::mutex storage_and_responses_lock;
|
|
|
|
/// Last committed Raft log number.
|
|
std::atomic<uint64_t> last_committed_idx;
|
|
|
|
Poco::Logger * log;
|
|
|
|
/// Cluster config for our quorum.
|
|
/// It's a copy of config stored in StateManager, but here
|
|
/// we also write it to disk during snapshot. Must be used with lock.
|
|
mutable std::mutex cluster_config_lock;
|
|
ClusterConfigPtr cluster_config;
|
|
|
|
/// Special part of ACL system -- superdigest specified in server config.
|
|
const std::string superdigest;
|
|
|
|
KeeperContextPtr keeper_context;
|
|
|
|
KeeperSnapshotManagerS3 * snapshot_manager_s3;
|
|
};
|
|
|
|
}
|