ClickHouse/dbms/src/Client/PerformanceTest.cpp
2017-05-09 21:52:58 +03:00

1266 lines
37 KiB
C++

#include <iostream>
#include <limits>
#include <unistd.h>
#include <sys/stat.h>
#include <boost/program_options.hpp>
#include <DB/AggregateFunctions/ReservoirSampler.h>
#include <DB/Client/ConnectionPool.h>
#include <DB/Common/ConcurrentBoundedQueue.h>
#include <DB/Common/Stopwatch.h>
#include <DB/Common/ThreadPool.h>
#include <DB/Core/Types.h>
#include <DB/DataStreams/RemoteBlockInputStream.h>
#include <DB/Interpreters/Settings.h>
#include <DB/IO/ReadHelpers.h>
#include <DB/IO/ReadBufferFromFileDescriptor.h>
#include <Poco/AutoPtr.h>
#include <Poco/XML/XMLStream.h>
#include <Poco/SAX/InputSource.h>
#include <Poco/Util/XMLConfiguration.h>
#include <Poco/Exception.h>
#include "InterruptListener.h"
/** Tests launcher for ClickHouse.
* The tool walks through given or default folder in order to find files with
* tests' description and launches it.
*/
namespace DB
{
namespace ErrorCodes
{
extern const int POCO_EXCEPTION;
extern const int STD_EXCEPTION;
extern const int UNKNOWN_EXCEPTION;
}
bool isNumber(const std::string & str) {
if (str.empty()) { return false; }
size_t dotsCounter = 0;
if (str[0] == '.' || str[str.size() - 1] == '.') {
return false;
}
for (char chr : str) {
if (chr == '.') {
if (dotsCounter)
return false;
else
++dotsCounter;
continue;
}
if (chr < '0' || chr > '9') {
return false;
}
}
return true;
}
class JSONString {
private:
std::map<std::string, std::string> content;
std::string current_key;
size_t _padding = 1;
public:
JSONString() {};
JSONString(size_t padding): _padding(padding) {};
JSONString & operator[](const std::string & key)
{
current_key = key;
return *this;
}
template <typename T>
typename std::enable_if<std::is_arithmetic<T>::value, JSONString & >::type
operator[](const T key)
{
current_key = std::to_string(key);
return *this;
}
void set(std::string value)
{
if (current_key.empty()) {
throw "cannot use set without key";
}
if (value.empty()) {
value = "null";
}
bool reserved = (value[0] == '[' || value[0] == '{' || value == "null");
if (!reserved && !isNumber(value)) {
value = '\"' + value + '\"';
}
content[current_key] = value;
current_key = "";
}
void set(const JSONString & innerJSON)
{
set(innerJSON.constructOutput());
}
void set(const std::vector<JSONString> & runInfos)
{
if (current_key.empty()) {
throw "cannot use set without key";
}
content[current_key] = "[\n";
for (size_t i = 0; i < runInfos.size(); ++i) {
for (size_t i = 0; i < _padding + 1; ++i) {
content[current_key] += "\t";
}
content[current_key] += runInfos[i].constructOutput(_padding + 2);
if (i != runInfos.size() - 1) {
content[current_key] += ',';
}
content[current_key] += "\n";
}
for (size_t i = 0; i < _padding; ++i) {
content[current_key] += "\t";
}
content[current_key] += ']';
current_key = "";
}
template <typename T>
typename std::enable_if<std::is_arithmetic<T>::value, void>::type set(T value)
{
set(std::to_string(value));
}
std::string constructOutput() const
{
return constructOutput(_padding);
}
std::string constructOutput(size_t padding) const
{
std::string output = "{";
bool first = true;
for (auto it = content.begin(); it != content.end(); ++it) {
if (! first) {
output += ',';
} else {
first = false;
}
output += "\n";
for (size_t i = 0; i < padding; ++i) {
output += "\t";
}
std::string key = '\"' + it->first + '\"';
std::string value = it->second;
output += key + ": " + value;
}
output += "\n";
for (size_t i = 0; i < padding - 1; ++i) {
output += "\t";
}
output += "}";
return output;
}
};
std::ostream & operator<<(std::ostream & stream, const JSONString & jsonObj)
{
stream << jsonObj.constructOutput();
return stream;
}
struct CriterionWithPriority {
std::string priority = "";
size_t value = 0;
bool fulfilled = false;
};
/// Termination criterions. The running test will be terminated in either of two conditions:
/// 1. All criterions marked 'min' are fulfilled
/// or
/// 2. Any criterion marked 'max' is fulfilled
class StopCriterions {
private:
using AbstractConfiguration = Poco::AutoPtr<Poco::Util::AbstractConfiguration>;
using Keys = std::vector<std::string>;
void initializeStruct(const std::string priority,
const AbstractConfiguration & stopCriterionsView)
{
Keys keys;
stopCriterionsView->keys(priority, keys);
for (const std::string & key : keys) {
if (key == "timeout_ms") {
timeout_ms.value = stopCriterionsView->getUInt64(priority + ".timeout_ms");
timeout_ms.priority = priority;
} else if (key == "rows_read") {
rows_read.value = stopCriterionsView->getUInt64(priority + ".rows_read");
rows_read.priority = priority;
} else if (key == "bytes_read_uncompressed") {
bytes_read_uncompressed.value = stopCriterionsView->getUInt64(priority + ".bytes_read_uncompressed");
bytes_read_uncompressed.priority = priority;
} else if (key == "iterations") {
iterations.value = stopCriterionsView->getUInt64(priority + ".iterations");
iterations.priority = priority;
} else if (key == "min_time_not_changing_for_ms") {
min_time_not_changing_for_ms.value = stopCriterionsView->getUInt64(priority + ".min_time_not_changing_for_ms");
min_time_not_changing_for_ms.priority = priority;
} else if (key == "max_speed_not_changing_for_ms") {
max_speed_not_changing_for_ms.value = stopCriterionsView->getUInt64(priority + ".max_speed_not_changing_for_ms");
max_speed_not_changing_for_ms.priority = priority;
} else if (key == "average_speed_not_changing_for_ms") {
average_speed_not_changing_for_ms.value = stopCriterionsView->getUInt64(priority + ".average_speed_not_changing_for_ms");
average_speed_not_changing_for_ms.priority = priority;
} else {
throw Poco::Exception("Met unkown stop criterion: " + key, 1);
}
if (priority == "min") { ++number_of_initialized_min; };
if (priority == "max") { ++number_of_initialized_max; };
}
}
public:
StopCriterions()
: number_of_initialized_min(0), number_of_initialized_max(0),
fulfilled_criterions_min(0), fulfilled_criterions_max(0) {}
void loadFromConfig(const AbstractConfiguration & stopCriterionsView)
{
if (stopCriterionsView->has("min")) {
initializeStruct("min", stopCriterionsView);
}
if (stopCriterionsView->has("max")) {
initializeStruct("max", stopCriterionsView);
}
}
void reset()
{
timeout_ms.fulfilled = false;
rows_read.fulfilled = false;
bytes_read_uncompressed.fulfilled = false;
iterations.fulfilled = false;
min_time_not_changing_for_ms.fulfilled = false;
max_speed_not_changing_for_ms.fulfilled = false;
average_speed_not_changing_for_ms.fulfilled = false;
fulfilled_criterions_min = 0;
fulfilled_criterions_max = 0;
}
struct CriterionWithPriority timeout_ms;
struct CriterionWithPriority rows_read;
struct CriterionWithPriority bytes_read_uncompressed;
struct CriterionWithPriority iterations;
struct CriterionWithPriority min_time_not_changing_for_ms;
struct CriterionWithPriority max_speed_not_changing_for_ms;
struct CriterionWithPriority average_speed_not_changing_for_ms;
/// Hereafter 'min' and 'max', in context of critetions, mean a level of importance
/// Number of initialized properties met in configuration
std::atomic<size_t> number_of_initialized_min;
std::atomic<size_t> number_of_initialized_max;
std::atomic<size_t> fulfilled_criterions_min;
std::atomic<size_t> fulfilled_criterions_max;
};
struct Stats
{
Stopwatch watch;
Stopwatch watch_per_query;
Stopwatch min_time_watch;
Stopwatch max_rows_speed_watch;
Stopwatch max_bytes_speed_watch;
Stopwatch avg_rows_speed_watch;
Stopwatch avg_bytes_speed_watch;
size_t queries;
size_t rows_read;
size_t bytes_read;
using Sampler = ReservoirSampler<double>;
Sampler sampler {1 << 16};
/// min_time in ms
UInt64 min_time = std::numeric_limits<UInt64>::max();
double total_time = 0;
double max_rows_speed = 0;
double max_bytes_speed = 0;
double avg_rows_speed_value = 0;
double avg_rows_speed_first = 0;
double avg_rows_speed_precision = 0.001;
double avg_bytes_speed_value = 0;
double avg_bytes_speed_first = 0;
double avg_bytes_speed_precision = 0.001;
size_t number_of_rows_speed_info_batches = 0;
size_t number_of_bytes_speed_info_batches = 0;
std::string getStatisticByName(const std::string & statisticName) {
if (statisticName == "min_time") {
return std::to_string(min_time) + "ms";
}
if (statisticName == "quantiles") {
std::string result = "\n";
for (double percent = 10; percent <= 90; percent += 10) {
result += "\t" + std::to_string((percent / 100));
result += ": " + std::to_string(sampler.quantileInterpolated(percent / 100.0));
result += "\n";
}
result += "\t0.95: " + std::to_string(sampler.quantileInterpolated(95 / 100.0)) + "\n";
result += "\t0.99: " + std::to_string(sampler.quantileInterpolated(99 / 100.0)) + "\n";
result += "\t0.999: " + std::to_string(sampler.quantileInterpolated(99.9 / 100.)) + "\n";
result += "\t0.9999: " + std::to_string(sampler.quantileInterpolated(99.99 / 100.));
return result;
}
if (statisticName == "total_time") {
return std::to_string(total_time) + "s";
}
if (statisticName == "queries_per_second") {
return std::to_string(queries / total_time);
}
if (statisticName == "rows_per_second") {
return std::to_string(rows_read / total_time);
}
if (statisticName == "bytes_per_second") {
return std::to_string(bytes_read / total_time);
}
if (statisticName == "max_rows_per_second") {
return std::to_string(max_rows_speed);
}
if (statisticName == "max_bytes_per_second") {
return std::to_string(max_bytes_speed);
}
if (statisticName == "avg_rows_per_second") {
return std::to_string(avg_rows_speed_value);
}
if (statisticName == "avg_bytes_per_second") {
return std::to_string(avg_bytes_speed_value);
}
return "";
}
void update_min_time(const UInt64 min_time_candidate)
{
if (min_time_candidate < min_time) {
min_time = min_time_candidate;
min_time_watch.restart();
}
}
void update_average_speed(const double new_speed_info, Stopwatch & avg_speed_watch,
size_t & number_of_info_batches, double precision,
double & avg_speed_first, double & avg_speed_value)
{
avg_speed_value = ((avg_speed_value * number_of_info_batches)
+ new_speed_info);
avg_speed_value /= (++number_of_info_batches);
if (avg_speed_first == 0) {
avg_speed_first = avg_speed_value;
}
if (abs(avg_speed_value - avg_speed_first) >= precision) {
avg_speed_first = avg_speed_value;
avg_speed_watch.restart();
}
}
void update_max_speed(const size_t max_speed_candidate, Stopwatch & max_speed_watch,
double & max_speed)
{
if (max_speed_candidate > max_speed) {
max_speed = max_speed_candidate;
max_speed_watch.restart();
}
}
void add(size_t rows_read_inc, size_t bytes_read_inc)
{
rows_read += rows_read_inc;
bytes_read += bytes_read_inc;
double new_rows_speed = rows_read_inc / watch_per_query.elapsedSeconds();
double new_bytes_speed = bytes_read_inc / watch_per_query.elapsedSeconds();
/// Update rows speed
update_max_speed(new_rows_speed, max_rows_speed_watch, max_rows_speed);
update_average_speed(new_rows_speed, avg_rows_speed_watch,
number_of_rows_speed_info_batches, avg_rows_speed_precision,
avg_rows_speed_first, avg_rows_speed_value);
/// Update bytes speed
update_max_speed(new_bytes_speed, max_bytes_speed_watch, max_bytes_speed);
update_average_speed(new_bytes_speed, avg_bytes_speed_watch,
number_of_bytes_speed_info_batches, avg_bytes_speed_precision,
avg_bytes_speed_first, avg_bytes_speed_value);
}
void updateQueryInfo()
{
++queries;
sampler.insert(watch_per_query.elapsedSeconds());
update_min_time(watch_per_query.elapsed() / (1000 * 1000)); /// ns to ms
}
void setTotalTime()
{
total_time = watch.elapsedSeconds();
}
void clear()
{
watch.restart();
watch_per_query.restart();
min_time_watch.restart();
max_rows_speed_watch.restart();
max_bytes_speed_watch.restart();
avg_rows_speed_watch.restart();
avg_bytes_speed_watch.restart();
sampler.clear();
queries = 0;
rows_read = 0;
bytes_read = 0;
min_time = std::numeric_limits<UInt64>::max();
total_time = 0;
max_rows_speed = 0;
max_bytes_speed = 0;
avg_rows_speed_value = 0;
avg_bytes_speed_value = 0;
avg_rows_speed_first = 0;
avg_bytes_speed_first = 0;
avg_rows_speed_precision = 0.001;
avg_bytes_speed_precision = 0.001;
number_of_rows_speed_info_batches = 0;
number_of_bytes_speed_info_batches = 0;
}
};
class PerformanceTest
{
public:
PerformanceTest(
const unsigned concurrency_,
const String & host_,
const UInt16 port_,
const String & default_database_,
const String & user_,
const String & password_,
const std::vector<std::string> & input_files,
const std::vector<std::string> & tags,
const std::vector<std::string> & without_tags,
const std::vector<std::string> & names,
const std::vector<std::string> & without_names,
const std::vector<std::string> & names_regexp,
const std::vector<std::string> & without_names_regexp
):
concurrency(concurrency_), queue(concurrency_),
connections(concurrency, host_, port_, default_database_, user_, password_),
pool(concurrency),
testsConfigurations(input_files.size())
{
if (input_files.size() < 1) {
throw Poco::Exception("No tests were specified", 1);
}
std::cerr << std::fixed << std::setprecision(3);
std::cout << std::fixed << std::setprecision(3);
readTestsConfiguration(input_files);
}
private:
unsigned concurrency;
std::string testName;
using Query = std::string;
using Queries = std::vector<std::string>;
Queries queries;
using Queue = ConcurrentBoundedQueue<Query>;
Queue queue;
using Keys = std::vector<std::string>;
ConnectionPool connections;
ThreadPool pool;
Settings settings;
InterruptListener interrupt_listener;
bool gotSIGINT = false;
std::vector<RemoteBlockInputStream*> streams;
double average_speed_precision = 0.001;
using XMLConfiguration = Poco::Util::XMLConfiguration;
using AbstractConfig = Poco::AutoPtr<Poco::Util::AbstractConfiguration>;
using Config = Poco::AutoPtr<XMLConfiguration>;
using Paths = std::vector<std::string>;
using StringToVector = std::map< std::string, std::vector<std::string> >;
StringToVector substitutions;
std::vector<Config> testsConfigurations;
using StringKeyValue = std::map<std::string, std::string>;
std::vector<StringKeyValue> substitutionsMaps;
struct StopCriterions stopCriterions;
#define incFulfilledCriterions(CRITERION) \
if (! stopCriterions.CRITERION.fulfilled) {\
stopCriterions.CRITERION.priority == "min" \
? ++stopCriterions.fulfilled_criterions_min \
: ++stopCriterions.fulfilled_criterions_max; \
stopCriterions.CRITERION.fulfilled = true; \
}
enum ExecutionType { loop, once };
ExecutionType execType;
size_t timesToRun = 1;
std::vector<Stats> statistics;
std::mutex mutex;
void readTestsConfiguration(const Paths & input_files)
{
testsConfigurations.resize(input_files.size());
for (size_t i = 0; i != input_files.size(); ++i) {
const std::string path = input_files[i];
testsConfigurations[i] = Config(new XMLConfiguration(path));
}
// TODO: here will be tests filter on tags, names, regexp matching, etc.
// { ... }
// for now let's launch one test only
if (testsConfigurations.size()) {
for (auto & testConfig : testsConfigurations) {
runTest(testConfig);
}
}
}
void runTest(Config & testConfig)
{
testName = testConfig->getString("name");
std::cout << "Running: " << testName << "\n";
/// Preprocess configuration file
if (testConfig->has("settings")) {
Keys configSettings;
testConfig->keys("settings", configSettings);
/// This macro goes through all settings in the Settings.h
/// and, if found any settings in test's xml configuration
/// with the same name, sets its value to settings
std::vector<std::string>::iterator it;
#define EXTRACT_SETTING(TYPE, NAME, DEFAULT) \
it = std::find(configSettings.begin(), configSettings.end(), #NAME); \
if (it != configSettings.end()) \
settings.set( \
#NAME, testConfig->getString("settings."#NAME) \
);
APPLY_FOR_SETTINGS(EXTRACT_SETTING)
APPLY_FOR_LIMITS(EXTRACT_SETTING)
#undef EXTRACT_SETTING
if (std::find(configSettings.begin(), configSettings.end(), "profile") !=
configSettings.end()) {
// TODO: proceed profile settings in a proper way
}
if (std::find(configSettings.begin(), configSettings.end(),
"average_rows_speed_precision") != configSettings.end()) {
statistics.back().avg_rows_speed_precision = testConfig->getDouble("settings.average_rows_speed_precision");
}
if (std::find(configSettings.begin(), configSettings.end(),
"average_bytes_speed_precision") != configSettings.end()) {
statistics.back().avg_bytes_speed_precision = testConfig->getDouble("settings.average_bytes_speed_precision");
}
}
Query query;
if (! testConfig->has("query")) {
throw Poco::Exception("Missing query field in test's config: " +
testName, 1);
}
query = testConfig->getString("query");
if (query.empty()) {
throw Poco::Exception("The query is empty in test's config: " +
testName, 1);
}
if (testConfig->has("substitutions")) {
/// Make "subconfig" of inner xml block
AbstractConfig substitutionsView(testConfig
->createView("substitutions"));
constructSubstitutions(substitutionsView, substitutions);
queries = formatQueries(query, substitutions);
} else {
// TODO: probably it will be a good practice to check if
// query string has {substitution pattern}, but no substitution field
// was found in xml configuration
queries.push_back(query);
}
if (! testConfig->has("type")) {
throw Poco::Exception("Missing type property in config: " +
testName);
}
std::string configExecType = testConfig->getString("type");
if (configExecType == "loop")
execType = loop;
else if (configExecType == "once")
execType = once;
else
throw Poco::Exception("Unknown type " + configExecType + " in :" +
testName, 1);
if (testConfig->has("stop")) {
AbstractConfig stopCriterionsView(testConfig
->createView("stop"));
stopCriterions.loadFromConfig(stopCriterionsView);
} else {
throw Poco::Exception("No termination conditions were found", 1);
}
if (testConfig->has("timesToRun")) {
timesToRun = testConfig->getUInt("timesToRun");
}
for (size_t numberOfLaunch = 0; numberOfLaunch < timesToRun; ++numberOfLaunch) {
stopCriterions.reset();
statistics.emplace_back();
if (execType == loop) {
runLoopQuery(queries[0]);
} else {
runQueries(queries);
}
statistics.back().setTotalTime();
}
AbstractConfig metricsView(testConfig->createView("metric"));
Keys metrics;
metricsView->keys(metrics);
if (metrics.size() > 1) {
throw Poco::Exception("More than 1 main metric is not allowed");
}
if (metrics.size() == 1) {
checkMetricInput(metrics[0]);
minOutput(metrics[0]);
} else {
constructTotalInfo();
}
}
void checkMetricInput(const std::string & main_metric) const {
std::vector<std::string> loopMetrics = {
"min_time", "quantiles", "total_time", "queries_per_second",
"rows_per_second", "bytes_per_second"
};
std::vector<std::string> infiniteMetrics = {
"max_rows_per_second", "max_bytes_per_second", "avg_rows_per_second",
"avg_bytes_per_second"
};
if (execType == loop) {
if (std::find(infiniteMetrics.begin(), infiniteMetrics.end(), main_metric) != infiniteMetrics.end()) {
throw Poco::Exception("Wrong type of main metric for loop "
"execution type");
}
} else {
if (std::find(loopMetrics.begin(), loopMetrics.end(), main_metric) != loopMetrics.end()) {
throw Poco::Exception("Wrong type of main metric for "
"inifinite execution type");
}
}
}
void runLoopQuery(const Query & query)
{
statistics.back().clear();
size_t max_iterations = stopCriterions.iterations.value;
size_t i = -1;
while (! gotSIGINT) {
++i;
pool.schedule(std::bind(
&PerformanceTest::thread,
this,
connections.IConnectionPool::get()
));
queue.push(query);
queue.push(""); /// asking thread to stop
pool.wait();
/// check stop criterions
if (max_iterations && i >= max_iterations) {
incFulfilledCriterions(iterations);
}
if (stopCriterions.number_of_initialized_min &&
(stopCriterions.fulfilled_criterions_min >=
stopCriterions.number_of_initialized_min)) {
/// All 'min' criterions are fulfilled
// TODO:
std::cout << "All 'min' criterions are fulfilled" << std::endl;
break;
}
if (stopCriterions.number_of_initialized_max &&
stopCriterions.fulfilled_criterions_max) {
/// Some 'max' criterions are fulfilled
// TODO:
std::cout << stopCriterions.fulfilled_criterions_max
<< "'max' criterions are fulfilled" << std::endl;
break;
}
}
}
void runQueries(const Queries & queries)
{
statistics.back().clear();
for (size_t i = 0; i < concurrency; ++i) {
pool.schedule(std::bind(
&PerformanceTest::thread,
this,
connections.IConnectionPool::get()
));
}
for (const Query & query : queries) {
queue.push(query);
}
for (size_t i = 0; i != concurrency; ++i) {
/// Genlty asking threads to stop
queue.push("");
}
pool.wait();
}
void thread(ConnectionPool::Entry & connection)
{
Query query;
while (true) {
queue.pop(query);
/// Empty query means end of execution
if (query.empty())
break;
execute(connection, query);
}
}
void execute(ConnectionPool::Entry & connection, const Query & query)
{
InterruptListener thread_interrupt_listener;
statistics.back().watch_per_query.restart();
RemoteBlockInputStream * stream = new RemoteBlockInputStream(
connection, query, &settings, nullptr, Tables()/*, query_processing_stage*/
);
size_t stream_index;
{
std::lock_guard<std::mutex> lock(mutex);
streams.push_back(stream);
stream_index = streams.size() - 1;
}
Progress progress;
stream->setProgressCallback(
[&progress, &stream, &thread_interrupt_listener, this]
(const Progress & value) {
progress.incrementPiecewiseAtomically(value);
this->checkFulfilledCriterionsAndUpdate(progress, stream, thread_interrupt_listener);
});
stream->readPrefix();
while (Block block = stream->read())
;
stream->readSuffix();
std::lock_guard<std::mutex> lock(mutex);
streams.erase(streams.begin() + stream_index);
delete stream;
statistics.back().updateQueryInfo();
// const BlockStreamProfileInfo & info = stream->getProfileInfo();
// double seconds = watch.elapsedSeconds();
// std::lock_guard<std::mutex> lock(mutex);
// info_per_interval.add(seconds, progress.rows, progress.bytes, info.rows, info.bytes);
// statistics.back().add(seconds, progress.rows, progress.bytes, info.rows, info.bytes);
}
void checkFulfilledCriterionsAndUpdate(const Progress & progress,
RemoteBlockInputStream * stream,
InterruptListener & thread_interrupt_listener)
{
std::lock_guard<std::mutex> lock(mutex);
statistics.back().add(progress.rows, progress.bytes);
size_t max_rows_to_read = stopCriterions.rows_read.value;
if (max_rows_to_read && statistics.back().rows_read >= max_rows_to_read) {
incFulfilledCriterions(rows_read);
}
size_t max_bytes_to_read = stopCriterions.bytes_read_uncompressed.value;
if (max_bytes_to_read && statistics.back().bytes_read >= max_bytes_to_read) {
incFulfilledCriterions(bytes_read_uncompressed);
}
if (UInt64 max_timeout_ms = stopCriterions.timeout_ms.value) {
/// cast nanoseconds to ms
if ((statistics.back().watch.elapsed() / (1000 * 1000)) > max_timeout_ms) {
incFulfilledCriterions(timeout_ms);
}
}
size_t min_time_not_changing_for_ms = stopCriterions
.min_time_not_changing_for_ms.value;
if (min_time_not_changing_for_ms) {
size_t min_time_did_not_change_for = statistics.back()
.min_time_watch
.elapsed() / (1000 * 1000);
if (min_time_did_not_change_for >= min_time_not_changing_for_ms) {
incFulfilledCriterions(min_time_not_changing_for_ms);
}
}
size_t max_speed_not_changing_for_ms = stopCriterions
.max_speed_not_changing_for_ms
.value;
if (max_speed_not_changing_for_ms) {
UInt64 speed_not_changing_time = statistics.back()
.max_rows_speed_watch
.elapsed() / (1000 * 1000);
if (speed_not_changing_time >= max_speed_not_changing_for_ms) {
incFulfilledCriterions(max_speed_not_changing_for_ms);
}
}
size_t average_speed_not_changing_for_ms = stopCriterions
.average_speed_not_changing_for_ms
.value;
if (average_speed_not_changing_for_ms) {
UInt64 speed_not_changing_time = statistics.back()
.avg_rows_speed_watch
.elapsed() / (1000 * 1000);
if (speed_not_changing_time >= average_speed_not_changing_for_ms) {
incFulfilledCriterions(average_speed_not_changing_for_ms);
}
}
if (stopCriterions.number_of_initialized_min &&
(stopCriterions.fulfilled_criterions_min >=
stopCriterions.number_of_initialized_min)) {
/// All 'min' criterions are fulfilled
// TODO:
std::cout << "All 'min' criterions are fulfilled" << std::endl;
stream->cancel();
}
if (stopCriterions.number_of_initialized_max &&
stopCriterions.fulfilled_criterions_max) {
/// Some 'max' criterions are fulfilled
// TODO:
std::cout << stopCriterions.fulfilled_criterions_max
<< "'max' criterions are fulfilled" << std::endl;
stream->cancel();
}
if (thread_interrupt_listener.check()) { /// SIGINT
gotSIGINT = true;
for (RemoteBlockInputStream * stream : streams) {
stream->cancel();
}
std::cout << "got SIGNINT; stopping streams" << std::endl;
}
}
void constructSubstitutions(AbstractConfig & substitutionsView,
StringToVector & substitutions)
{
Keys xml_substitutions;
substitutionsView->keys(xml_substitutions);
for (size_t i = 0; i != xml_substitutions.size(); ++i) {
const AbstractConfig xml_substitution(
substitutionsView->createView("substitution[" +
std::to_string(i) + "]")
);
/// Property values for substitution will be stored in a vector
/// accessible by property name
std::vector<std::string> xml_values;
xml_substitution->keys("values", xml_values);
std::string name = xml_substitution->getString("name");
for (size_t j = 0; j != xml_values.size(); ++j) {
substitutions[name].push_back(
xml_substitution->getString("values.value[" +
std::to_string(j) + "]")
);
}
}
}
std::vector<std::string> formatQueries(const std::string & query,
StringToVector substitutions)
{
std::vector<std::string> queries;
StringToVector::iterator substitutions_first = substitutions.begin();
StringToVector::iterator substitutions_last = substitutions.end();
--substitutions_last;
std::map<std::string, std::string> substitutionsMap;
runThroughAllOptionsAndPush(
substitutions_first, substitutions_last, query, queries, substitutionsMap
);
return queries;
}
/// Recursive method which goes through all substitution blocks in xml
/// and replaces property {names} by their values
void runThroughAllOptionsAndPush(
StringToVector::iterator substitutions_left,
StringToVector::iterator substitutions_right,
const std::string & template_query,
std::vector<std::string> & queries,
const StringKeyValue & templateSubstitutionsMap = StringKeyValue()
)
{
std::string name = substitutions_left->first;
std::vector<std::string> values = substitutions_left->second;
for (const std::string & value : values) {
/// Copy query string for each unique permutation
Query query = template_query;
StringKeyValue substitutionsMap = templateSubstitutionsMap;
size_t substrPos = 0;
while (substrPos != std::string::npos) {
substrPos = query.find("{" + name + "}");
if (substrPos != std::string::npos) {
query.replace(
substrPos, 1 + name.length() + 1,
value
);
}
}
substitutionsMap[name] = value;
/// If we've reached the end of substitution chain
if (substitutions_left == substitutions_right) {
queries.push_back(query);
substitutionsMaps.push_back(substitutionsMap);
} else {
StringToVector::iterator next_it = substitutions_left;
++next_it;
runThroughAllOptionsAndPush(
next_it, substitutions_right, query, queries, substitutionsMap
);
}
}
}
public:
void constructTotalInfo()
{
JSONString jsonOutput;
std::string hostname = "";
char hostname_buffer[256];
if (gethostname(hostname_buffer, 256) == 0) {
hostname = std::string(hostname_buffer);
}
jsonOutput["hostname"].set(hostname);
jsonOutput["Number of CPUs: "].set(sysconf(_SC_NPROCESSORS_ONLN));
jsonOutput["test_name"].set(testName);
if (substitutions.size()) {
JSONString jsonParameters;
for (auto it = substitutions.begin(); it != substitutions.end(); ++it) {
std::string parameter = it->first;
std::vector<std::string> values = it->second;
std::string arrayString = "[";
for (size_t i = 0; i != values.size(); ++i) {
arrayString += '\"' + values[i] + '\"';
if (i != values.size() - 1) {
arrayString += ", ";
}
}
arrayString += ']';
jsonParameters[parameter].set(arrayString);
}
jsonOutput["parameters"].set(jsonParameters);
}
std::vector<JSONString> runInfos(timesToRun);
for (size_t numberOfLaunch = 0; numberOfLaunch < timesToRun; ++numberOfLaunch) {
JSONString runJSON;
if (execType == loop) {
runJSON["min_time"].set(std::to_string(statistics[numberOfLaunch].min_time / 1000)
+ "." + std::to_string(statistics[numberOfLaunch].min_time % 1000) + "s");
JSONString quantiles(4); /// here, 4 is the size of \t padding
for (double percent = 10; percent <= 90; percent += 10) {
quantiles[percent / 100].set(statistics[numberOfLaunch].sampler.quantileInterpolated(percent / 100.0));
}
quantiles[0.95].set(statistics[numberOfLaunch].sampler.quantileInterpolated(95 / 100.0));
quantiles[0.99].set(statistics[numberOfLaunch].sampler.quantileInterpolated(99 / 100.0));
quantiles[0.999].set(statistics[numberOfLaunch].sampler.quantileInterpolated(99.9 / 100.0));
quantiles[0.9999].set(statistics[numberOfLaunch].sampler.quantileInterpolated(99.99 / 100.0));
runJSON["quantiles"].set(quantiles);
runJSON["total_time"].set(std::to_string(statistics[numberOfLaunch].total_time) + "s");
runJSON["queries_per_second"].set(double(statistics[numberOfLaunch].queries) / statistics[numberOfLaunch].total_time);
runJSON["rows_per_second"].set(double(statistics[numberOfLaunch].rows_read) / statistics[numberOfLaunch].total_time);
runJSON["bytes_per_second"].set(double(statistics[numberOfLaunch].bytes_read) / statistics[numberOfLaunch].total_time);
} else {
runJSON["max_rows_per_second"].set(statistics[numberOfLaunch].max_rows_speed);
runJSON["max_bytes_per_second"].set(statistics[numberOfLaunch].max_bytes_speed);
runJSON["avg_rows_per_second"].set(statistics[numberOfLaunch].avg_rows_speed_value);
runJSON["avg_bytes_per_second"].set(statistics[numberOfLaunch].avg_bytes_speed_value);
}
runInfos[numberOfLaunch] = runJSON;
}
jsonOutput["runs"].set(runInfos);
std::cout << jsonOutput << std::endl;
}
void minOutput(const std::string & main_metric)
{
// TODO: remove
std::cout << "test" << std::endl;
for (size_t numberOfLaunch = 0; numberOfLaunch < timesToRun; ++numberOfLaunch) {
std::cout << "run " << numberOfLaunch + 1 << ": ";
std::cout << main_metric << " = " << statistics[numberOfLaunch].getStatisticByName(main_metric);
std::cout << std::endl;
}
}
};
}
int mainEntryClickhousePerformanceTest(int argc, char ** argv) {
using namespace DB;
try
{
using boost::program_options::value;
using Strings = std::vector<std::string>;
boost::program_options::options_description desc("Allowed options");
desc.add_options()
("help", "produce help message")
("concurrency,c", value<unsigned>()->default_value(1), "number of parallel queries")
("host,h", value<std::string>()->default_value("localhost"), "")
("port", value<UInt16>()->default_value(9000), "")
("user", value<std::string>()->default_value("default"), "")
("password", value<std::string>()->default_value(""), "")
("database", value<std::string>()->default_value("default"), "")
("tag", value<Strings>(), "Run only tests with tag")
("without-tag", value<Strings>(), "Do not run tests with tag")
("name", value<Strings>(), "Run tests with specific name")
("without-name", value<Strings>(), "Do not run tests with name")
("name-regexp", value<Strings>(), "Run tests with names matching regexp")
("without-name-regexp", value<Strings>(), "Do not run tests with names matching regexp")
;
/// These options will not be displayed in --help
boost::program_options::options_description hidden("Hidden options");
hidden.add_options()
("input-files", value< std::vector<std::string> >(), "")
;
/// But they will be legit, though. And they must be given without name
boost::program_options::positional_options_description positional;
positional.add("input-files", -1);
boost::program_options::options_description cmdline_options;
cmdline_options.add(desc).add(hidden);
boost::program_options::variables_map options;
boost::program_options::store(
boost::program_options::command_line_parser(argc, argv)
.options(cmdline_options)
.positional(positional)
.run(),
options
);
boost::program_options::notify(options);
if (options.count("help"))
{
std::cout << "Usage: " << argv[0] << " [options] [test_file ...] [tests_folder]\n";
std::cout << desc << "\n";
return 1;
}
if (! options.count("input-files")) {
std::cerr << "No tests files were specified. See --help" << "\n";
return 1;
}
Strings tests_tags;
Strings skip_tags;
Strings tests_names;
Strings skip_names;
Strings name_regexp;
Strings skip_matching_regexp;
if (options.count("tag")) {
tests_tags = options["tag"].as<Strings>();
}
if (options.count("without-tag")) {
skip_tags = options["without-tag"].as<Strings>();
}
if (options.count("name")) {
tests_names = options["name"].as<Strings>();
}
if (options.count("without-name")) {
skip_names = options["without-name"].as<Strings>();
}
if (options.count("name-regexp")) {
name_regexp = options["name-regexp"].as<Strings>();
}
if (options.count("without-name-regexp")) {
skip_matching_regexp = options["without-name-regexp"].as<Strings>();
}
PerformanceTest performanceTest(
options["concurrency"].as<unsigned>(),
options["host" ].as<std::string>(),
options["port" ].as<UInt16>(),
options["database" ].as<std::string>(),
options["user" ].as<std::string>(),
options["password" ].as<std::string>(),
options["input-files"].as<Strings>(),
tests_tags,
skip_tags,
tests_names,
skip_names,
name_regexp,
skip_matching_regexp
);
}
catch (const Exception & e)
{
std::string text = e.displayText();
std::cerr << "Code: " << e.code() << ". " << text << "\n\n";
/// Если есть стек-трейс на сервере, то не будем писать стек-трейс на клиенте.
if (std::string::npos == text.find("Stack trace"))
std::cerr << "Stack trace:\n"
<< e.getStackTrace().toString();
return e.code();
}
catch (const Poco::Exception & e)
{
std::cerr << "Poco::Exception: " << e.displayText() << "\n";
return ErrorCodes::POCO_EXCEPTION;
}
catch (const std::exception & e)
{
std::cerr << "std::exception: " << e.what() << "\n";
return ErrorCodes::STD_EXCEPTION;
}
catch (...)
{
std::cerr << "Unknown exception\n";
return ErrorCodes::UNKNOWN_EXCEPTION;
}
return 0;
}