ClickHouse/src/Storages/PostgreSQL/PostgreSQLReplicaConsumer.h

107 lines
3.5 KiB
C++
Raw Normal View History

#pragma once
2021-01-19 15:29:22 +00:00
#include "PostgreSQLConnection.h"
2021-02-03 16:13:18 +00:00
#include "PostgreSQLReplicaMetadata.h"
2021-02-06 12:28:42 +00:00
#include "pqxx/pqxx"
#include <Core/BackgroundSchedulePool.h>
#include <common/logger_useful.h>
2021-01-31 19:03:03 +00:00
#include <Storages/IStorage.h>
#include <Storages/PostgreSQL/insertPostgreSQLValue.h>
#include <DataStreams/OneBlockInputStream.h>
2021-02-06 12:28:42 +00:00
namespace DB
{
class PostgreSQLReplicaConsumer
{
public:
using Storages = std::unordered_map<String, StoragePtr>;
PostgreSQLReplicaConsumer(
std::shared_ptr<Context> context_,
2021-02-04 17:17:16 +00:00
PostgreSQLConnectionPtr connection_,
const std::string & replication_slot_name_,
const std::string & publication_name_,
2021-02-03 16:13:18 +00:00
const std::string & metadata_path,
2021-02-06 12:28:42 +00:00
const std::string & start_lsn,
2021-01-31 19:03:03 +00:00
const size_t max_block_size_,
Storages storages_);
/// Start reading WAL from current_lsn position. Initial data sync from created snapshot already done.
void startSynchronization();
void stopSynchronization();
private:
2021-01-31 19:03:03 +00:00
/// Executed by wal_reader_task. A separate thread reads wal and advances lsn to last commited position
/// after rows were written via copyData.
void replicationStream();
void stopReplicationStream();
2021-02-03 16:13:18 +00:00
enum class PostgreSQLQuery
{
INSERT,
UPDATE,
DELETE
};
bool readFromReplicationSlot();
void syncTables(std::shared_ptr<pqxx::nontransaction> tx, const std::unordered_set<std::string> & tables_to_sync);
String advanceLSN(std::shared_ptr<pqxx::nontransaction> ntx);
void processReplicationMessage(
const char * replication_message, size_t size, std::unordered_set<std::string> & tables_to_sync);
2021-02-03 16:13:18 +00:00
struct BufferData
{
ExternalResultDescription description;
MutableColumns columns;
/// Needed for insertPostgreSQLValue() method to parse array
std::unordered_map<size_t, PostgreSQLArrayInfo> array_info;
BufferData(const Block block)
{
description.init(block);
columns = description.sample_block.cloneEmptyColumns();
for (const auto idx : ext::range(0, description.sample_block.columns()))
if (description.types[idx].first == ExternalResultDescription::ValueType::vtArray)
preparePostgreSQLArrayInfo(array_info, idx, description.sample_block.getByPosition(idx).type);
}
};
using Buffers = std::unordered_map<String, BufferData>;
void insertDefaultValue(BufferData & buffer, size_t column_idx);
void insertValue(BufferData & buffer, const std::string & value, size_t column_idx);
void readTupleData(BufferData & buffer, const char * message, size_t & pos, PostgreSQLQuery type, bool old_value = false);
2021-01-31 19:03:03 +00:00
/// Methods to parse replication message data.
2021-01-19 15:29:22 +00:00
void readString(const char * message, size_t & pos, size_t size, String & result);
Int64 readInt64(const char * message, size_t & pos);
Int32 readInt32(const char * message, size_t & pos);
Int16 readInt16(const char * message, size_t & pos);
Int8 readInt8(const char * message, size_t & pos);
2021-01-27 15:29:28 +00:00
Poco::Logger * log;
std::shared_ptr<Context> context;
const std::string replication_slot_name;
const std::string publication_name;
2021-02-03 16:13:18 +00:00
PostgreSQLReplicaMetadata metadata;
2021-02-04 17:17:16 +00:00
PostgreSQLConnectionPtr connection;
2021-02-06 12:28:42 +00:00
std::string current_lsn, final_lsn;
const size_t max_block_size;
std::string table_to_insert;
2021-01-27 15:29:28 +00:00
BackgroundSchedulePool::TaskHolder wal_reader_task;
std::atomic<bool> stop_synchronization = false;
2021-01-31 19:03:03 +00:00
Storages storages;
Buffers buffers;
};
}