ClickHouse/utils/keeper-bench/Runner.cpp

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

466 lines
16 KiB
C++
Raw Normal View History

2021-04-13 12:36:47 +00:00
#include "Runner.h"
2023-04-07 13:02:42 +00:00
#include <Poco/Util/AbstractConfiguration.h>
2021-04-13 12:36:47 +00:00
2023-04-07 13:02:42 +00:00
#include "Common/ZooKeeper/ZooKeeperCommon.h"
#include "Common/ZooKeeper/ZooKeeperConstants.h"
2023-04-07 14:14:39 +00:00
#include <Common/EventNotifier.h>
2023-04-06 15:10:58 +00:00
#include <Common/Config/ConfigProcessor.h>
2023-04-17 11:25:46 +00:00
#include "IO/ReadBufferFromString.h"
#include <IO/WriteBufferFromFile.h>
#include <IO/WriteBufferFromString.h>
#include <IO/copyData.h>
2023-04-14 13:32:08 +00:00
2023-04-14 13:32:08 +00:00
/// Metric identifiers passed to the worker thread pool created in the Runner constructor.
/// They are only declared here; the definitions live in another translation unit.
namespace CurrentMetrics
{
    extern const Metric LocalThread;
    extern const Metric LocalThreadActive;
    extern const Metric LocalThreadScheduled;
}
2023-04-06 15:10:58 +00:00
/// Error codes used by the exceptions thrown in this file.
/// They are only declared here; the definitions live in another translation unit.
namespace DB::ErrorCodes
{
    extern const int BAD_ARGUMENTS;
    extern const int CANNOT_BLOCK_SIGNAL;
}
2023-04-06 15:10:58 +00:00
/// Builds a benchmark runner from a config file plus optional command-line overrides.
///
/// Each std::optional argument, when set, takes precedence over the matching config key;
/// otherwise the config value (or the built-in default) is used:
///   concurrency_       -> "concurrency"        (default 1)
///   max_iterations_    -> "iterations"         (default 0, treated as "no limit" by runBenchmark)
///   delay_             -> "report_delay"       (default 1.0)
///   max_time_          -> "timelimit"          (default 0.0, a non-positive value disables the limit)
///   continue_on_error_ -> "continue_on_error"  (default false)
/// A non-empty hosts_strings_ is used instead of the "connections" section of the config.
/// The effective options are echoed to stderr.
///
/// Throws DB::Exception(BAD_ARGUMENTS) when no configuration object could be loaded.
Runner::Runner(
    std::optional<size_t> concurrency_,
    const std::string & config_path,
    const Strings & hosts_strings_,
    std::optional<double> max_time_,
    std::optional<double> delay_,
    std::optional<bool> continue_on_error_,
    std::optional<size_t> max_iterations_)
    : info(std::make_shared<Stats>())
{
    DB::ConfigProcessor config_processor(config_path, true, false);
    auto config = config_processor.loadConfig().configuration;

    /// The configuration is dereferenced unconditionally below (generator and run options),
    /// so it has to be validated before the first use rather than only on the "no hosts" path.
    if (!config)
        throw DB::Exception(DB::ErrorCodes::BAD_ARGUMENTS, "No config file or hosts defined");

    generator.emplace(*config);

    if (!hosts_strings_.empty())
    {
        for (const auto & host : hosts_strings_)
            connection_infos.push_back({.host = host});
    }
    else
    {
        parseHostsFromConfig(*config);
    }

    std::cerr << "---- Run options ---- " << std::endl;

    static constexpr uint64_t DEFAULT_CONCURRENCY = 1;
    if (concurrency_)
        concurrency = *concurrency_;
    else
        concurrency = config->getUInt64("concurrency", DEFAULT_CONCURRENCY);
    std::cerr << "Concurrency: " << concurrency << std::endl;

    static constexpr uint64_t DEFAULT_ITERATIONS = 0;
    if (max_iterations_)
        max_iterations = *max_iterations_;
    else
        max_iterations = config->getUInt64("iterations", DEFAULT_ITERATIONS);
    std::cerr << "Iterations: " << max_iterations << std::endl;

    static constexpr double DEFAULT_DELAY = 1.0;
    if (delay_)
        delay = *delay_;
    else
        delay = config->getDouble("report_delay", DEFAULT_DELAY);
    std::cerr << "Report delay: " << delay << std::endl;

    static constexpr double DEFAULT_TIME_LIMIT = 0.0;
    if (max_time_)
        max_time = *max_time_;
    else
        max_time = config->getDouble("timelimit", DEFAULT_TIME_LIMIT);
    std::cerr << "Time limit: " << max_time << std::endl;

    if (continue_on_error_)
        continue_on_error = *continue_on_error_;
    else
        continue_on_error = config->getBool("continue_on_error", false);
    std::cerr << "Continue on error: " << continue_on_error << std::endl;

    /// Output settings come from the config only; there is no command-line override for them.
    static const std::string output_key = "output";
    print_to_stdout = config->getBool(output_key + ".stdout", false);
    std::cerr << "Printing output to stdout: " << print_to_stdout << std::endl;

    /// "output.file" is either a plain path or a section with "path" and "with_timestamp".
    static const std::string output_file_key = output_key + ".file";
    if (config->has(output_file_key))
    {
        if (config->has(output_file_key + ".path"))
        {
            file_output = config->getString(output_file_key + ".path");
            output_file_with_timestamp = config->getBool(output_file_key + ".with_timestamp");
        }
        else
        {
            file_output = config->getString(output_file_key);
        }

        std::cerr << "Result file path: " << file_output->string() << std::endl;
    }

    std::cerr << "---- Run options ----\n" << std::endl;

    /// One pool thread and one queue slot per unit of concurrency.
    pool.emplace(CurrentMetrics::LocalThread, CurrentMetrics::LocalThreadActive, CurrentMetrics::LocalThreadScheduled, concurrency);
    queue.emplace(concurrency);
}
/// Fills `connection_infos` from the "connections" section of `config`.
///
/// Options set directly under "connections" act as defaults for every entry.
/// Child keys starting with "host" are plain host strings. Child keys starting with
/// "connection" (other than the "connection_timeout_ms" default option) are sub-sections
/// with their own "host", an optional "sessions" count and optional per-connection overrides.
void Runner::parseHostsFromConfig(const Poco::Util::AbstractConfiguration & config)
{
    /// Copies every connection option that is present under `prefix` into `target`.
    const auto apply_overrides = [&config](const std::string & prefix, ConnectionInfo & target)
    {
        if (const auto option = prefix + ".secure"; config.has(option))
            target.secure = config.getBool(option);

        if (const auto option = prefix + ".session_timeout_ms"; config.has(option))
            target.session_timeout_ms = config.getInt(option);

        if (const auto option = prefix + ".operation_timeout_ms"; config.has(option))
            target.operation_timeout_ms = config.getInt(option);

        if (const auto option = prefix + ".connection_timeout_ms"; config.has(option))
            target.connection_timeout_ms = config.getInt(option);

        if (const auto option = prefix + ".use_compression"; config.has(option))
            target.use_compression = config.getBool(option);
    };

    ConnectionInfo defaults;
    apply_overrides("connections", defaults);

    Poco::Util::AbstractConfiguration::Keys entries;
    config.keys("connections", entries);

    for (const auto & entry : entries)
    {
        const std::string entry_path = "connections." + entry;

        if (entry.starts_with("host"))
        {
            ConnectionInfo parsed = defaults;
            parsed.host = config.getString(entry_path);
            connection_infos.push_back(std::move(parsed));
            continue;
        }

        /// "connection_timeout_ms" shares the prefix but is one of the default options handled above.
        const bool is_connection_section = entry.starts_with("connection") && entry != "connection_timeout_ms";
        if (!is_connection_section)
            continue;

        ConnectionInfo parsed = defaults;
        parsed.host = config.getString(entry_path + ".host");

        if (const auto sessions_option = entry_path + ".sessions"; config.has(sessions_option))
            parsed.sessions = config.getUInt64(sessions_option);

        apply_overrides(entry_path, parsed);
        connection_infos.push_back(std::move(parsed));
    }
}
/// Worker loop executed by every pool thread.
///
/// Repeatedly takes a request from the shared queue, sends it through a randomly chosen
/// connection from `zookeepers`, waits for the response and records latency and traffic
/// in `info`. Returns when `shutdown` is set or `max_iterations` requests were executed.
///
/// On a failed request the exception is rethrown (after setting `shutdown`) unless
/// `continue_on_error` is set; in that case the error is printed to stderr and, if any
/// session has expired, the connections are refreshed before continuing.
///
/// Throws DB::ErrnoException(CANNOT_BLOCK_SIGNAL) if SIGINT cannot be blocked for this thread.
void Runner::thread(std::vector<std::shared_ptr<Coordination::ZooKeeper>> zookeepers)
{
    Coordination::ZooKeeperRequestPtr request;

    /// Randomly choosing connection index
    pcg64 rng(randomSeed());
    std::uniform_int_distribution<size_t> distribution(0, zookeepers.size() - 1);

    /// In these threads we do not accept INT signal.
    sigset_t sig_set;
    if (sigemptyset(&sig_set)
        || sigaddset(&sig_set, SIGINT)
        || pthread_sigmask(SIG_BLOCK, &sig_set, nullptr))
    {
        throw DB::ErrnoException(DB::ErrorCodes::CANNOT_BLOCK_SIGNAL, "Cannot block signal");
    }

    while (true)
    {
        /// Poll the queue with a bounded wait (the 100 is presumably a timeout in milliseconds)
        /// so that the stop conditions are re-checked regularly even when the queue is empty.
        bool extracted = false;
        while (!extracted)
        {
            extracted = queue->tryPop(request, 100);

            if (shutdown
                || (max_iterations && requests_executed >= max_iterations))
            {
                return;
            }
        }

        const auto connection_index = distribution(rng);
        auto & zk = zookeepers[connection_index];

        auto promise = std::make_shared<std::promise<size_t>>();
        auto future = promise->get_future();

        /// `request` is captured by reference: this thread blocks on `future` below,
        /// so `request` is not reassigned before the callback has run.
        Coordination::ResponseCallback callback = [&request, promise](const Coordination::Response & response)
        {
            bool set_exception = true;

            if (response.error == Coordination::Error::ZOK)
            {
                set_exception = false;
            }
            else if (response.error == Coordination::Error::ZNONODE)
            {
                /// remove can fail with ZNONODE because of different order of execution
                /// of generated create and remove requests
                /// this is okay for concurrent runs
                if (dynamic_cast<const Coordination::ZooKeeperRemoveResponse *>(&response))
                {
                    set_exception = false;
                }
                else if (const auto * multi_response = dynamic_cast<const Coordination::ZooKeeperMultiResponse *>(&response))
                {
                    /// Pointer cast instead of reference cast: a mismatch must not throw
                    /// std::bad_cast out of the response callback.
                    const auto * multi_request = dynamic_cast<const Coordination::ZooKeeperMultiRequest *>(&*request);
                    if (multi_request)
                    {
                        const auto & responses = multi_response->responses;

                        /// Locate the first sub-response that failed with ZNONODE.
                        /// The scan is bounded: nothing guarantees here that such an entry exists.
                        size_t i = 0;
                        while (i < responses.size() && responses[i]->error != Coordination::Error::ZNONODE)
                            ++i;

                        /// Only tolerate the failure when the failing sub-request is a remove.
                        if (i < responses.size()
                            && i < multi_request->requests.size()
                            && dynamic_cast<const Coordination::ZooKeeperRemoveRequest *>(&*multi_request->requests[i]))
                        {
                            set_exception = false;
                        }
                    }
                }
            }

            if (set_exception)
                promise->set_exception(std::make_exception_ptr(zkutil::KeeperException(response.error)));
            else
                promise->set_value(response.bytesSize());
        };

        Stopwatch watch;

        zk->executeGenericRequest(request, callback);

        try
        {
            auto response_size = future.get();
            auto microseconds = watch.elapsedMicroseconds();

            std::lock_guard lock(mutex);

            if (request->isReadRequest())
                info->addRead(microseconds, 1, request->bytesSize() + response_size);
            else
                info->addWrite(microseconds, 1, request->bytesSize() + response_size);
        }
        catch (...)
        {
            if (!continue_on_error)
            {
                /// Tell the other workers and the producer to stop before propagating the error.
                shutdown = true;
                throw;
            }

            std::cerr << DB::getCurrentExceptionMessage(true, true /*check embedded stack trace*/) << std::endl;

            bool got_expired = false;
            for (const auto & connection : zookeepers)
            {
                if (connection->isExpired())
                {
                    got_expired = true;
                    break;
                }
            }

            if (got_expired)
            {
                /// Keep retrying until the connections are refreshed; every failure is logged.
                while (true)
                {
                    try
                    {
                        zookeepers = refreshConnections();
                        break;
                    }
                    catch (...)
                    {
                        std::cerr << DB::getCurrentExceptionMessage(true, true /*check embedded stack trace*/) << std::endl;
                    }
                }
            }
        }

        /// Counted for both successful and tolerated-failure requests.
        ++requests_executed;
    }
}
2023-04-07 14:14:39 +00:00
/// Keeps trying to hand `request` to the worker queue until it is accepted or the run must stop.
///
/// Returns true once the request was queued and no stop condition fired in the same
/// polling round. Returns false when `shutdown` is set, when the positive `max_time`
/// limit has elapsed, or when `interrupt_listener` reports an interrupt.
/// While waiting, prints a progress report whenever more than `delay` seconds
/// (if positive) have passed since the previous one.
bool Runner::tryPushRequestInteractively(Coordination::ZooKeeperRequestPtr && request, DB::InterruptListener & interrupt_listener)
{
    bool pushed = false;

    do
    {
        pushed = queue->tryPush(std::move(request), 100);

        /// An exception occurred in a worker
        if (shutdown)
            return false;

        const bool time_limit_reached = max_time > 0 && total_watch.elapsedSeconds() >= max_time;
        if (time_limit_reached)
        {
            std::cerr << "Stopping launch of queries. Requested time limit is exhausted.\n";
            return false;
        }

        if (interrupt_listener.check())
        {
            std::cerr << "Stopping launch of queries. SIGINT received." << std::endl;
            return false;
        }

        const bool report_due = delay > 0 && delay_watch.elapsedSeconds() > delay;
        if (report_due)
        {
            printNumberOfRequestsExecuted(requests_executed);

            /// The statistics are shared with the workers, so report under the mutex.
            std::lock_guard lock(mutex);
            info->report(concurrency);
            delay_watch.restart();
        }
    } while (!pushed);

    return true;
}
void Runner::runBenchmark()
{
2023-04-07 13:02:42 +00:00
createConnections();
std::cerr << "Preparing to run\n";
2023-04-07 13:02:42 +00:00
generator->startup(*connections[0]);
std::cerr << "Prepared\n";
2023-04-17 11:25:46 +00:00
2023-04-17 15:09:35 +00:00
auto start_timestamp_ms = Poco::Timestamp().epochMicroseconds() / 1000;
2023-04-17 11:25:46 +00:00
2021-04-13 12:36:47 +00:00
try
{
for (size_t i = 0; i < concurrency; ++i)
{
2023-04-07 13:02:42 +00:00
auto thread_connections = connections;
2023-09-21 10:54:09 +00:00
pool->scheduleOrThrowOnError([this, connections_ = std::move(thread_connections)]() mutable { thread(connections_); });
2021-04-13 12:36:47 +00:00
}
}
catch (...)
{
shutdown = true;
2023-04-07 14:14:39 +00:00
pool->wait();
2021-04-13 12:36:47 +00:00
throw;
}
DB::InterruptListener interrupt_listener;
delay_watch.restart();
/// Push queries into queue
for (size_t i = 0; !max_iterations || i < max_iterations; ++i)
{
if (!tryPushRequestInteractively(generator->generate(), interrupt_listener))
{
shutdown = true;
break;
}
}
2023-04-07 14:14:39 +00:00
pool->wait();
2021-04-13 12:36:47 +00:00
total_watch.stop();
printNumberOfRequestsExecuted(requests_executed);
std::lock_guard lock(mutex);
2023-04-14 13:32:08 +00:00
info->report(concurrency);
2023-04-17 11:25:46 +00:00
DB::WriteBufferFromOwnString out;
info->writeJSON(out, concurrency, start_timestamp_ms);
auto output_string = std::move(out.str());
if (print_to_stdout)
std::cout << output_string << std::endl;
if (file_output)
{
auto path = *file_output;
if (output_file_with_timestamp)
{
auto filename = file_output->filename();
filename = fmt::format("{}_{}{}", filename.stem().generic_string(), start_timestamp_ms, filename.extension().generic_string());
path = file_output->parent_path() / filename;
}
std::cerr << "Storing output to " << path << std::endl;
DB::WriteBufferFromFile file_output_buffer(path);
DB::ReadBufferFromString read_buffer(output_string);
DB::copyData(read_buffer, file_output_buffer);
}
2021-04-13 12:36:47 +00:00
}
2023-04-07 13:02:42 +00:00
void Runner::createConnections()
2021-04-13 12:36:47 +00:00
{
2023-04-07 14:14:39 +00:00
DB::EventNotifier::init();
2023-04-14 13:32:08 +00:00
std::cerr << "---- Creating connections ---- " << std::endl;
2023-04-07 13:02:42 +00:00
for (size_t connection_info_idx = 0; connection_info_idx < connection_infos.size(); ++connection_info_idx)
{
const auto & connection_info = connection_infos[connection_info_idx];
2023-04-14 13:32:08 +00:00
std::cerr << fmt::format("Creating {} session(s) for:\n"
2023-04-07 13:02:42 +00:00
"- host: {}\n"
"- secure: {}\n"
"- session timeout: {}ms\n"
"- operation timeout: {}ms\n"
"- connection timeout: {}ms",
connection_info.sessions,
connection_info.host,
connection_info.secure,
connection_info.session_timeout_ms,
connection_info.operation_timeout_ms,
connection_info.connection_timeout_ms) << std::endl;
for (size_t session = 0; session < connection_info.sessions; ++session)
{
connections.emplace_back(getConnection(connection_info, connection_info_idx));
2023-04-07 13:02:42 +00:00
connections_to_info_map[connections.size() - 1] = connection_info_idx;
}
2021-04-13 12:36:47 +00:00
}
2023-04-14 13:32:08 +00:00
std::cerr << "---- Done creating connections ----\n" << std::endl;
2023-04-07 13:02:42 +00:00
}
2021-04-13 12:36:47 +00:00
std::shared_ptr<Coordination::ZooKeeper> Runner::getConnection(const ConnectionInfo & connection_info, size_t connection_info_idx)
2023-04-07 13:02:42 +00:00
{
Coordination::ZooKeeper::Node node{Poco::Net::SocketAddress{connection_info.host}, static_cast<UInt8>(connection_info_idx), connection_info.secure};
2023-04-07 13:02:42 +00:00
std::vector<Coordination::ZooKeeper::Node> nodes;
nodes.push_back(node);
zkutil::ZooKeeperArgs args;
args.session_timeout_ms = connection_info.session_timeout_ms;
args.connection_timeout_ms = connection_info.connection_timeout_ms;
args.operation_timeout_ms = connection_info.operation_timeout_ms;
args.use_compression = connection_info.use_compression;
2023-04-07 13:02:42 +00:00
return std::make_shared<Coordination::ZooKeeper>(nodes, args, nullptr);
}
2023-04-07 13:02:42 +00:00
/// Replaces every expired connection in `connections` with a fresh one to the same host
/// and returns a copy of the updated list. Runs under `connection_mutex`.
std::vector<std::shared_ptr<Coordination::ZooKeeper>> Runner::refreshConnections()
{
    std::lock_guard lock(connection_mutex);

    for (size_t connection_idx = 0; connection_idx < connections.size(); ++connection_idx)
    {
        auto & connection = connections[connection_idx];
        if (!connection->isExpired())
            continue;

        /// getConnection expects the index of the ConnectionInfo entry, exactly as
        /// createConnections passes it. The connection slot index differs from it as soon
        /// as one host has more than one session.
        const auto connection_info_idx = connections_to_info_map[connection_idx];
        const auto & connection_info = connection_infos[connection_info_idx];
        connection = getConnection(connection_info, connection_info_idx);
    }

    return connections;
}
2023-04-07 14:14:39 +00:00
/// Stops the workers and lets the generator clean up through the first connection.
///
/// Nothing is allowed to escape: an exception leaving a destructor terminates the
/// program, so failures are printed to stderr instead.
Runner::~Runner()
{
    try
    {
        queue->clearAndFinish();
        shutdown = true;
        pool->wait();
    }
    catch (...)
    {
        std::cerr << DB::getCurrentExceptionMessage(true, true /*check embedded stack trace*/) << std::endl;
    }

    /// `connections` stays empty when the benchmark was never started or connecting failed,
    /// in which case there is no connection to clean up through.
    if (connections.empty())
        return;

    try
    {
        generator->cleanup(*connections[0]);
    }
    catch (...)
    {
        std::cerr << DB::getCurrentExceptionMessage(true, true /*check embedded stack trace*/) << std::endl;
    }
}