ClickHouse/dbms/src/Client/PerformanceTest.cpp

489 lines
14 KiB
C++
Raw Normal View History

2017-01-13 18:26:51 +00:00
#include <iostream>
2017-01-20 12:36:16 +00:00
#include <sys/stat.h>
#include <boost/program_options.hpp>
#include <DB/Client/ConnectionPool.h>
2017-01-20 12:36:16 +00:00
#include <DB/Common/ThreadPool.h>
#include <DB/Common/ConcurrentBoundedQueue.h>
2017-01-20 12:36:16 +00:00
#include <DB/Core/Types.h>
#include <DB/DataStreams/RemoteBlockInputStream.h>
#include <DB/Interpreters/Settings.h>
2017-01-20 12:36:16 +00:00
#include <DB/IO/ReadHelpers.h>
#include <DB/IO/ReadBufferFromFileDescriptor.h>
2017-01-20 12:36:16 +00:00
#include <Poco/AutoPtr.h>
#include <Poco/XML/XMLStream.h>
#include <Poco/SAX/InputSource.h>
#include <Poco/Util/XMLConfiguration.h>
#include <Poco/Exception.h>
2017-01-13 18:26:51 +00:00
/** Tests launcher for ClickHouse.
* The tool walks through the given or default folder in order to find files with
* tests' descriptions and launches them.
*/
namespace DB
{
/// Error codes used as return values of the tool's entry point.
/// They are only declared here; their definitions are not part of this file.
namespace ErrorCodes
{
/// Returned when a Poco::Exception reaches the entry point.
extern const int POCO_EXCEPTION;
/// Returned when a std::exception reaches the entry point.
extern const int STD_EXCEPTION;
/// Returned when an exception of any other type reaches the entry point.
extern const int UNKNOWN_EXCEPTION;
}
class PerformanceTest
{
public:
2017-01-20 12:36:16 +00:00
PerformanceTest(
const unsigned concurrency_,
const String & host_,
const UInt16 port_,
const String & default_database_,
const String & user_,
const String & password_,
const std::vector<std::string> & input_files,
const std::vector<std::string> & tags,
const std::vector<std::string> & without_tags,
const std::vector<std::string> & names,
const std::vector<std::string> & without_names,
const std::vector<std::string> & names_regexp,
const std::vector<std::string> & without_names_regexp
2017-01-20 12:36:16 +00:00
):
concurrency(concurrency_), queue(concurrency_),
2017-01-20 12:36:16 +00:00
connections(concurrency, host_, port_, default_database_, user_, password_),
pool(concurrency),
testsConfigurations(input_files.size())
2017-01-13 18:26:51 +00:00
{
2017-01-20 12:36:16 +00:00
if (input_files.size() < 1) {
throw Poco::Exception("No tests were specified", 1);
}
2017-01-13 18:26:51 +00:00
// std::cerr << std::fixed << std::setprecision(3);
2017-01-20 12:36:16 +00:00
readTestsConfiguration(input_files);
2017-01-13 18:26:51 +00:00
}
private:
2017-01-20 12:36:16 +00:00
/// Number of worker tasks scheduled for every query; the constructor also uses
/// it to size the queue, the connection pool and the thread pool.
unsigned concurrency;
/// How many times runQuery pushes a query to the queue when the execution
/// type is not `loop`.
size_t max_iterations = 1;
using Query = std::string;
using Queries = std::vector<std::string>;
/// Queries of the test being run; filled by runTest.
Queries queries;
using Queue = ConcurrentBoundedQueue<Query>;
/// Hands queries from runQuery to the worker threads; an empty query tells
/// a worker to stop.
Queue queue;
2017-01-20 12:36:16 +00:00
/// Source of the connection entries handed to the workers in runQuery.
ConnectionPool connections;
/// Runs the worker tasks scheduled by runQuery.
ThreadPool pool;
/// Settings passed to every executed query; runTest overrides individual
/// values from the "settings" section of a test's configuration.
Settings settings;
2017-01-20 12:36:16 +00:00
/// Shorthands for the Poco configuration types and containers used below.
using XMLConfiguration = Poco::Util::XMLConfiguration;
/// Reference-counted handle to any configuration (used for configuration views).
using AbstractConfig = Poco::AutoPtr<Poco::Util::AbstractConfiguration>;
/// Reference-counted handle to a test's XML configuration.
using Config = Poco::AutoPtr<XMLConfiguration>;
using Paths = std::vector<std::string>;
/// Maps a substitution name to the list of values it can take.
using StringToVector = std::map< std::string, std::vector<std::string> >;
2017-01-20 12:36:16 +00:00
/// One parsed configuration per input file, in the order the files were given.
std::vector<Config> testsConfigurations;
/// Execution type of a test, taken from the "type" property of its configuration.
enum ExecutionType { loop, once };
/// Execution type of the test being run; assigned by runTest before any query is run.
ExecutionType execType;
void readTestsConfiguration(const Paths & input_files)
2017-01-20 12:36:16 +00:00
{
testsConfigurations.resize(input_files.size());
for (size_t i = 0; i != input_files.size(); ++i) {
const std::string path = input_files[i];
testsConfigurations[i] = Config(new XMLConfiguration(path));
2017-01-20 12:36:16 +00:00
}
// TODO: here will be tests filter on tags, names, regexp matching, etc.
2017-01-20 12:36:16 +00:00
// { ... }
// for now let's launch one test only
if (testsConfigurations.size()) {
for (auto & testConfig : testsConfigurations) {
runTest(testConfig);
}
}
}
/// Runs the single test described by `testConfig`:
///  - applies the values from the optional "settings" section to `settings`;
///  - reads the mandatory "query" template and expands it with the optional
///    "substitutions" section into the list of queries to run;
///  - reads the mandatory "type" property ("loop" or "once");
///  - prints and runs every resulting query.
/// Throws Poco::Exception when "query" is missing or empty, or when "type"
/// is missing or has an unknown value.
void runTest(Config & testConfig)
{
    const std::string testName = testConfig->getString("name");
    std::cout << "Running: " << testName << "\n";

    /// `queries` is a member shared by all tests. Drop what the previous test
    /// left there, otherwise its queries would be executed again by this one.
    queries.clear();

    /// NOTE(review): `settings` is shared between tests as well, so values set
    /// by one test stay in effect for the following ones - confirm it is intended.

    /// Preprocess configuration file
    using Keys = std::vector<std::string>;

    if (testConfig->has("settings")) {
        Keys configSettings;
        testConfig->keys("settings", configSettings);

        /// This macro goes through all settings in the Settings.h
        /// and, if found any settings in test's xml configuration
        /// with the same name, sets its value to settings
        Keys::iterator it;
        #define EXTRACT_SETTING(TYPE, NAME, DEFAULT) \
            it = std::find(configSettings.begin(), configSettings.end(), #NAME); \
            if (it != configSettings.end()) \
                settings.set( \
                    #NAME, testConfig->getString("settings."#NAME) \
                );
        APPLY_FOR_SETTINGS(EXTRACT_SETTING)
        APPLY_FOR_LIMITS(EXTRACT_SETTING)
        #undef EXTRACT_SETTING

        if (std::find(configSettings.begin(), configSettings.end(), "profile") !=
            configSettings.end()) {
            // TODO: proceed profile settings in a proper way
        }
    }

    if (! testConfig->has("query")) {
        throw Poco::Exception("Missing query field in test's config: " +
                              testName, 1);
    }

    const Query query = testConfig->getString("query");
    if (query.empty()) {
        throw Poco::Exception("The query is empty in test's config: " +
                              testName, 1);
    }

    if (testConfig->has("substitutions")) {
        /// Make "subconfig" of inner xml block
        AbstractConfig substitutionsView(testConfig
            ->createView("substitutions"));

        StringToVector substitutions;
        constructSubstitutions(substitutionsView, substitutions);

        queries = formatQueries(query, substitutions);
    } else {
        // TODO: probably it will be a good practice to check if
        // query string has {substitution pattern}, but no substitution field
        // was found in xml configuration
        queries.push_back(query);
    }

    if (! testConfig->has("type")) {
        /// Same exception code as the other configuration errors of this method.
        throw Poco::Exception("Missing type property in config: " +
                              testName, 1);
    }

    const std::string configExecType = testConfig->getString("type");
    if (configExecType == "loop")
        execType = loop;
    else if (configExecType == "once")
        execType = once;
    else
        throw Poco::Exception("Unknown type " + configExecType + " in :" +
                              testName, 1);

    for (const Query & formatted_query : queries) {
        std::cout << formatted_query << std::endl;
        runQuery(formatted_query);
    }
}
/// Runs `query` on `concurrency` workers: schedules the workers, feeds them
/// through the queue, sends one stop marker per worker and waits for the pool.
void runQuery(const Query & query)
{
    // TODO: proceed terminationConditions

    /// Schedule the workers; a connection entry taken from the pool is bound to each.
    size_t scheduled = 0;
    while (scheduled < concurrency) {
        pool.schedule(std::bind(
            &PerformanceTest::thread,
            this,
            connections.IConnectionPool::get()
        ));
        ++scheduled;
    }

    /// Feed the workers.
    /// NOTE: for the `loop` execution type this loop has no exit condition yet,
    /// so the code below it is never reached for such tests.
    size_t pushed = 0;
    while (execType == loop || pushed < max_iterations) {
        // TODO: start timer and terminate after time exceeds
        queue.push(query);
        ++pushed;
    }

    /// Gently ask the threads to stop: one empty query per worker.
    for (size_t remaining = concurrency; remaining != 0; --remaining)
        queue.push("");

    pool.wait();
}
/// Worker body: takes queries from the queue and executes them over
/// `connection` until an empty query (the stop marker) is received.
void thread(ConnectionPool::Entry & connection)
{
    Query query;

    /// Empty query means end of execution
    for (queue.pop(query); !query.empty(); queue.pop(query))
        execute(connection, query);
}
/// Sends `query` over `connection` with the current `settings`, reads the
/// whole result and prints the column names of every received block.
void execute(ConnectionPool::Entry & connection, const Query & query)
{
    // TODO: measure the execution time (Stopwatch), collect Progress through
    // stream.setProgressCallback and accumulate it together with the stream's
    // BlockStreamProfileInfo into per-interval and total statistics (under a mutex).

    RemoteBlockInputStream stream(connection, query, &settings, nullptr, Tables());

    stream.readPrefix();

    /// An empty block marks the end of the result.
    while (true) {
        Block block = stream.read();
        if (!block)
            break;

        for (const auto & column : block.getColumns())
            std::cout << column.name << std::endl;
    }

    stream.readSuffix();
}
/// Reads the "substitution" blocks of `substitutionsView` and, for each of
/// them, appends its values to `substitutions` under the block's "name".
/// Blocks are addressed as "substitution[i]", values as "values.value[j]".
void constructSubstitutions(AbstractConfig & substitutionsView,
                            StringToVector & substitutions)
{
    using Keys = std::vector<std::string>;

    /// Only the number of keys is used: blocks are addressed by index below.
    Keys block_keys;
    substitutionsView->keys(block_keys);
    const size_t blocks_count = block_keys.size();

    for (size_t block = 0; block < blocks_count; ++block) {
        const std::string block_path = "substitution[" + std::to_string(block) + "]";
        const AbstractConfig substitution(substitutionsView->createView(block_path));

        /// Property values for substitution will be stored in a vector
        /// accessible by property name
        Keys value_keys;
        substitution->keys("values", value_keys);
        const std::string name = substitution->getString("name");

        const size_t values_count = value_keys.size();
        for (size_t index = 0; index < values_count; ++index) {
            const std::string value_path = "values.value[" + std::to_string(index) + "]";
            substitutions[name].push_back(substitution->getString(value_path));
        }
    }
}
2017-01-20 12:36:16 +00:00
std::vector<std::string> formatQueries(const std::string & query,
StringToVector substitutions) const
{
std::vector<std::string> queries;
StringToVector::iterator substitutions_first = substitutions.begin();
StringToVector::iterator substitutions_last = substitutions.end();
--substitutions_last;
runThroughAllOptionsAndPush(
substitutions_first, substitutions_last, query, queries
);
return queries;
}
/// Recursive method which goes through all substitution blocks in xml
/// and replaces property {names} by their values.
///
/// `substitutions_left` is the substitution processed by this call and
/// `substitutions_right` is the last one of the chain (inclusive). For every
/// value of the current substitution a copy of `template_query` gets all
/// "{name}" placeholders replaced; the copy is appended to `queries` if this
/// was the last substitution, otherwise it is passed on to the next one.
/// The replacement is single-pass: text inserted as a value is never scanned
/// for the placeholder again.
void runThroughAllOptionsAndPush(
    StringToVector::iterator substitutions_left,
    StringToVector::iterator substitutions_right,
    const std::string & template_query,
    std::vector<std::string> & queries
) const
{
    /// The map is not modified during the recursion, so references are safe.
    const std::string & name = substitutions_left->first;
    const std::vector<std::string> & values = substitutions_left->second;
    const std::string placeholder = "{" + name + "}";

    for (const std::string & value : values) {
        /// Copy query string for each unique permutation
        Query query = template_query;

        size_t position = query.find(placeholder);
        while (position != std::string::npos) {
            query.replace(position, placeholder.length(), value);
            /// Continue after the inserted text: restarting from the beginning
            /// would never finish when the value contains the placeholder itself.
            position = query.find(placeholder, position + value.length());
        }

        /// If we've reached the end of substitution chain
        if (substitutions_left == substitutions_right) {
            queries.push_back(query);
        } else {
            StringToVector::iterator next_it = substitutions_left;
            ++next_it;

            runThroughAllOptionsAndPush(
                next_it, substitutions_right, query, queries
            );
        }
    }
}
2017-01-13 18:26:51 +00:00
};
}
2017-01-13 18:26:51 +00:00
int mainEntryClickhousePerformanceTest(int argc, char ** argv) {
2017-01-20 12:36:16 +00:00
using namespace DB;
try
{
using boost::program_options::value;
using Strings = std::vector<std::string>;
boost::program_options::options_description desc("Allowed options");
desc.add_options()
("help", "produce help message")
("concurrency,c", value<unsigned>()->default_value(1), "number of parallel queries")
("host,h", value<std::string>()->default_value("localhost"), "")
("port", value<UInt16>()->default_value(9000), "")
("user", value<std::string>()->default_value("default"), "")
("password", value<std::string>()->default_value(""), "")
("database", value<std::string>()->default_value("default"), "")
("tag", value<Strings>(), "Run only tests with tag")
("without-tag", value<Strings>(), "Do not run tests with tag")
("name", value<Strings>(), "Run tests with specific name")
("without-name", value<Strings>(), "Do not run tests with name")
("name-regexp", value<Strings>(), "Run tests with names matching regexp")
("without-name-regexp", value<Strings>(), "Do not run tests with names matching regexp")
;
2017-01-20 12:36:16 +00:00
/// These options will not be displayed in --help
boost::program_options::options_description hidden("Hidden options");
hidden.add_options()
("input-files", value< std::vector<std::string> >(), "")
;
/// But they will be legit, though. And they must be given without name
boost::program_options::positional_options_description positional;
positional.add("input-files", -1);
boost::program_options::options_description cmdline_options;
cmdline_options.add(desc).add(hidden);
boost::program_options::variables_map options;
boost::program_options::store(
boost::program_options::command_line_parser(argc, argv)
.options(cmdline_options)
.positional(positional)
.run(),
options
);
boost::program_options::notify(options);
if (options.count("help"))
{
std::cout << "Usage: " << argv[0] << " [options] [test_file ...] [tests_folder]\n";
std::cout << desc << "\n";
return 1;
}
if (! options.count("input-files")) {
std::cerr << "No tests files were specified. See --help" << "\n";
return 1;
}
Strings tests_tags;
Strings skip_tags;
Strings tests_names;
Strings skip_names;
Strings name_regexp;
Strings skip_matching_regexp;
if (options.count("tag")) {
tests_tags = options["tag"].as<Strings>();
}
if (options.count("without-tag")) {
skip_tags = options["without-tag"].as<Strings>();
}
if (options.count("name")) {
tests_names = options["name"].as<Strings>();
}
if (options.count("without-name")) {
skip_names = options["without-name"].as<Strings>();
}
if (options.count("name-regexp")) {
name_regexp = options["name-regexp"].as<Strings>();
}
if (options.count("without-name-regexp")) {
skip_matching_regexp = options["without-name-regexp"].as<Strings>();
}
PerformanceTest performanceTest(
options["concurrency"].as<unsigned>(),
options["host" ].as<std::string>(),
options["port" ].as<UInt16>(),
options["database" ].as<std::string>(),
options["user" ].as<std::string>(),
options["password" ].as<std::string>(),
options["input-files"].as<Strings>(),
tests_tags,
skip_tags,
tests_names,
skip_names,
name_regexp,
skip_matching_regexp
2017-01-20 12:36:16 +00:00
);
}
catch (const Exception & e)
{
std::string text = e.displayText();
std::cerr << "Code: " << e.code() << ". " << text << "\n\n";
/// Если есть стек-трейс на сервере, то не будем писать стек-трейс на клиенте.
if (std::string::npos == text.find("Stack trace"))
std::cerr << "Stack trace:\n"
<< e.getStackTrace().toString();
return e.code();
}
catch (const Poco::Exception & e)
{
std::cerr << "Poco::Exception: " << e.displayText() << "\n";
return ErrorCodes::POCO_EXCEPTION;
}
catch (const std::exception & e)
{
std::cerr << "std::exception: " << e.what() << "\n";
return ErrorCodes::STD_EXCEPTION;
}
catch (...)
{
std::cerr << "Unknown exception\n";
return ErrorCodes::UNKNOWN_EXCEPTION;
}
return 0;
2017-01-13 18:26:51 +00:00
}