ClickHouse/docker/test/performance-comparison/perf.py

#!/usr/bin/python3

import os
import sys
import itertools
import clickhouse_driver
import xml.etree.ElementTree as et
import argparse
import pprint
import time
import traceback

# Moment (in time.perf_counter() seconds) at which the current stage started.
stage_start_seconds = time.perf_counter()

def report_stage_end(stage_name):
    """Report the duration of the stage that just finished and restart the timer.

    Prints one tab-separated line to stdout: the stage name followed by the
    number of seconds elapsed since the previous call (or since the module
    was loaded, for the first call). The module-level timer is then reset so
    that the next call measures the next stage.
    """
    global stage_start_seconds
    elapsed_seconds = time.perf_counter() - stage_start_seconds
    print(stage_name, elapsed_seconds, sep='\t')
    stage_start_seconds = time.perf_counter()

report_stage_end('start')

# Command line: one test description file, plus the servers to compare and
# the number of measured runs per query.
parser = argparse.ArgumentParser(description='Run performance test.')
# Explicitly decode files as UTF-8 because sometimes we have Russian characters in queries, and LANG=C is set.
parser.add_argument('file', metavar='FILE', type=argparse.FileType('r', encoding='utf-8'), nargs=1, help='test description file')
parser.add_argument('--host', nargs='*', default=['127.0.0.1', '127.0.0.1'], help='server hosts, paired by position with --port')
# Convert ports to int so that values given on the command line have the same
# type as the defaults, and a non-numeric port is rejected at parse time.
parser.add_argument('--port', nargs='*', type=int, default=[9001, 9002], help='server ports, paired by position with --host')
parser.add_argument('--runs', type=int, default=int(os.environ.get('CHPC_RUNS', 7)), help='number of measured runs of each query (default: $CHPC_RUNS or 7)')
args = parser.parse_args()

# nargs=1 makes args.file a one-element list. Parse the XML test description
# and close the file handle as soon as the tree has been built.
with args.file[0] as test_file:
    tree = et.parse(test_file)
root = tree.getroot()

# Check main metric: a test may either declare no main metric at all or
# declare min_time; anything else cannot be measured by this script.
main_metric_element = root.find('main_metric/*')
if main_metric_element is not None:
    if main_metric_element.tag != 'min_time':
        raise Exception("Only the min_time main metric is supported. This test uses '{}'".format(main_metric_element.tag))

# FIXME another way to detect infinite tests. They should have an appropriate main_metric but sometimes they don't.
# The presence of this element anywhere in the document is taken as the sign.
infinite_sign = root.find('.//average_speed_not_changing_for_ms')
if not (infinite_sign is None):
    raise Exception('Looks like the test is infinite (sign 1)')

# Open connections: one client per (host, port) pair, in command-line order.
# zip() stops at the shorter list, so a host or port without a partner is ignored.
servers = [dict(host=host, port=port) for host, port in zip(args.host, args.port)]
connections = [
    clickhouse_driver.Client(host=server['host'], port=server['port'])
    for server in servers
]

report_stage_end('connect')

# Apply settings: every child element of <settings> is turned into a
# "set <tag> = '<text>'" statement, and the statements are executed on each
# connection in document order.
settings = root.findall('settings/*')
set_statements = ["set {} = '{}'".format(setting.tag, setting.text) for setting in settings]
for connection in connections:
    for statement in set_statements:
        connection.execute(statement)

# Check tables that should exist. If they don't exist, just skip this test.
# Every table named in preconditions/table_exists is probed on every server;
# the first query that fails ends the run with exit status 0.
tables = [e.text for e in root.findall('preconditions/table_exists')]
for t in tables:
    for c in connections:
        try:
            c.execute("show create table {}".format(t))
        except Exception:
            # Catch Exception rather than everything: a bare except would also
            # turn Ctrl-C (KeyboardInterrupt) or SystemExit into a "skipped"
            # test that exits successfully.
            # The last line of the formatted exception is the error message
            # itself; it goes to stdout next to the 'skipped' marker, and the
            # full traceback goes to stderr.
            print('skipped\t' + traceback.format_exception_only(*sys.exc_info()[:2])[-1])
            traceback.print_exc()
            sys.exit(0)

report_stage_end('preconditions')

# Process substitutions: each <substitution> has a <name> and a list of
# <values>/<value>; the combinations are the Cartesian product of all the
# value lists, with the values keyed by substitution name.
subst_elems = root.findall('substitutions/substitution')

# Substitution names, e.g. ['table', 'limit'].
parameter_keys = [elem.find('name').text for elem in subst_elems]
# Values per substitution, e.g. [['hits_100m', 'hits_10m'], ['1', '10']].
parameter_value_arrays = [
    [value.text for value in elem.findall('values/value')]
    for elem in subst_elems
]
# One dict per combination, e.g. [{table: hits_100m, limit: 1}, ...].
# With no substitutions at all this is a single empty dict.
parameter_combinations = [
    dict(zip(parameter_keys, values))
    for values in itertools.product(*parameter_value_arrays)
]

# Take care to keep the order of queries -- sometimes we have DROP IF EXISTS
# followed by CREATE in create queries section, so the order matters.
def substitute_parameters(query_templates, parameter_combinations):
    """Expand query templates with the given parameter combinations.

    Each template is a str.format() template and each combination is a dict
    of parameter name -> value. The result lists, for the first template, the
    queries for every combination, then the queries for the second template,
    and so on, so the relative order of the templates is preserved.

    A template that does not mention every parameter formats to the same text
    for several combinations. Such repeats are emitted only once per template
    (at the position of their first occurrence), so that the same query is not
    executed again for every value of a parameter it does not use. Identical
    templates listed more than once are still expanded separately.

    Raises KeyError if a template references a name that is missing from a
    combination.
    """
    # Materialise the combinations so that they can be iterated once per template.
    parameter_combinations = list(parameter_combinations)

    queries = []
    for template in query_templates:
        seen = set()
        for parameters in parameter_combinations:
            query = template.format(**parameters)
            if query not in seen:
                seen.add(query)
                queries.append(query)
    return queries

report_stage_end('substitute')

# Run drop queries, ignoring errors: this is a best-effort cleanup before the
# tables are created, so a failing query is logged to stderr and the script
# carries on with the next one.
drop_query_templates = [q.text for q in root.findall('drop_query')]
drop_queries = substitute_parameters(drop_query_templates, parameter_combinations)
for c in connections:
    for q in drop_queries:
        try:
            c.execute(q)
        except Exception:
            # Only ordinary errors are ignored. A bare except would also
            # swallow KeyboardInterrupt and SystemExit, making the script
            # impossible to interrupt while it is in this loop.
            traceback.print_exc()

# Run create queries: all of them on the first server, then all of them on
# the next one, in the order produced by substitute_parameters(). Errors are
# not caught here.
create_query_templates = [elem.text for elem in root.findall('create_query')]
create_queries = substitute_parameters(create_query_templates, parameter_combinations)
for connection, query in itertools.product(connections, create_queries):
    connection.execute(query)

# Run fill queries: expand the <fill_query> templates and execute every
# resulting query on each server in turn. Errors are not caught here.
fill_query_templates = [elem.text for elem in root.findall('fill_query')]
fill_queries = substitute_parameters(fill_query_templates, parameter_combinations)
for connection in connections:
    for fill_query in fill_queries:
        connection.execute(fill_query)

report_stage_end('fill')

# Run test queries
# Per-character rewrite table for tsv_escape(): backslash, tab and newline
# are replaced by their backslash escapes, carriage returns are removed.
_TSV_ESCAPES = str.maketrans({'\\': '\\\\', '\t': '\\t', '\n': '\\n', '\r': None})

def tsv_escape(s):
    """Return s made safe for use as a single field of a TSV line.

    Backslashes are doubled, tabs and newlines become the two-character
    sequences backslash-t and backslash-n, and carriage returns are dropped.
    """
    return s.translate(_TSV_ESCAPES)

# Expand the <query> templates into the list of queries to measure.
test_query_templates = [elem.text for elem in root.findall('query')]
test_queries = substitute_parameters(test_query_templates, parameter_combinations)

report_stage_end('substitute2')

for query in test_queries:
    # Prewarm: run once on both servers. Helps to bring the data into memory,
    # precompile the queries, etc. The result is reported as a 'prewarm' line:
    # query, server index, elapsed time.
    for conn_index, connection in enumerate(connections):
        res = connection.execute(query, query_id='prewarm {} {}'.format(0, query))
        prewarm_fields = ['prewarm', tsv_escape(query), str(conn_index), str(connection.last_query.elapsed)]
        print('\t'.join(prewarm_fields))

    # Now, perform measured runs.
    # Track the time spent by the client to process this query, so that we can
    # notice the queries that take long to process on the client side, e.g. by
    # sending excessive data.
    start_seconds = time.perf_counter()
    server_seconds = 0
    for run in range(args.runs):
        # Within a run the servers are queried one after another, so the runs
        # of the servers are interleaved.
        for conn_index, connection in enumerate(connections):
            res = connection.execute(query)
            # One 'query' line per run and server: query, run number, server
            # index, elapsed time.
            run_fields = ['query', tsv_escape(query), str(run), str(conn_index), str(connection.last_query.elapsed)]
            print('\t'.join(run_fields))
            server_seconds += connection.last_query.elapsed

    # Summary line for the query: wall-clock time of all measured runs as seen
    # by this script, next to the sum of the elapsed times reported above.
    client_seconds = time.perf_counter() - start_seconds
    print('\t'.join(['client-time', tsv_escape(query), str(client_seconds), str(server_seconds)]))

report_stage_end('benchmark')

# Run drop queries once more, now that the measurements are done. Unlike the
# drop pass at the beginning of the script, errors are not caught here.
drop_query_templates = [elem.text for elem in root.findall('drop_query')]
drop_queries = substitute_parameters(drop_query_templates, parameter_combinations)
for connection, query in itertools.product(connections, drop_queries):
    connection.execute(query)

report_stage_end('drop')
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`#!/usr/bin/python3`

[wip] performance comparison 2020-01-21 18:15:25 +00:00			`import os`
[wip] performance comparison test 2020-01-16 14:29:30 +00:00			`import sys`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`import itertools`
			`import clickhouse_driver`
			`import xml.etree.ElementTree as et`
			`import argparse`
			`import pprint`
[wip] performance comparison test 2020-01-16 19:39:07 +00:00			`import time`
			`import traceback`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00
performance comparison 2020-02-14 12:55:47 +00:00			`stage_start_seconds = time.perf_counter()`

			`def report_stage_end(stage_name):`
			`global stage_start_seconds`
			`print('{}\t{}'.format(stage_name, time.perf_counter() - stage_start_seconds))`
			`stage_start_seconds = time.perf_counter()`

			`report_stage_end('start')`

[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`parser = argparse.ArgumentParser(description='Run performance test.')`
Performance comparison improvements. 2020-01-10 14:06:07 +00:00			`# Explicitly decode files as UTF-8 because sometimes we have Russian characters in queries, and LANG=C is set.`
			`parser.add_argument('file', metavar='FILE', type=argparse.FileType('r', encoding='utf-8'), nargs=1, help='test description file')`
[wip] performance comparison 2020-01-21 18:15:25 +00:00			`parser.add_argument('--host', nargs='*', default=['127.0.0.1', '127.0.0.1'])`
			`parser.add_argument('--port', nargs='*', default=[9001, 9002])`
			`parser.add_argument('--runs', type=int, default=int(os.environ.get('CHPC_RUNS', 7)))`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`args = parser.parse_args()`

			`tree = et.parse(args.file[0])`
			`root = tree.getroot()`

			`# Check main metric`
[wip] perf comparison: docker + some tweaks 2019-12-26 19:16:36 +00:00			`main_metric_element = root.find('main_metric/*')`
[wip] performance comparison fixes 2019-12-26 21:33:10 +00:00			`if main_metric_element is not None and main_metric_element.tag != 'min_time':`
			`raise Exception('Only the min_time main metric is supported. This test uses \'{}\''.format(main_metric_element.tag))`

			`# FIXME another way to detect infinite tests. They should have an appropriate main_metric but sometimes they don't.`
			`infinite_sign = root.find('.//average_speed_not_changing_for_ms')`
			`if infinite_sign is not None:`
			`raise Exception('Looks like the test is infinite (sign 1)')`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00
			`# Open connections`
[wip] performance comparison 2020-01-21 18:15:25 +00:00			`servers = [{'host': host, 'port': port} for (host, port) in zip(args.host, args.port)]`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`connections = [clickhouse_driver.Client(**server) for server in servers]`

performance comparison 2020-02-14 12:55:47 +00:00			`report_stage_end('connect')`

[wip] perf comparison: docker + some tweaks 2019-12-26 19:16:36 +00:00			`# Apply settings`
			`settings = root.findall('settings/*')`
			`for c in connections:`
			`for s in settings:`
			`c.execute("set {} = '{}'".format(s.tag, s.text))`

performance comparison 2020-02-28 16:22:07 +00:00			`# Check tables that should exist. If they don't exist, just skip this test.`
			`tables = [e.text for e in root.findall('preconditions/table_exists')]`
			`for t in tables:`
			`for c in connections:`
			`try:`
			`res = c.execute("show create table {}".format(t))`
			`except:`
			`print('skipped\t' + traceback.format_exception_only(*sys.exc_info()[:2])[-1])`
			`traceback.print_exc()`
			`sys.exit(0)`

performance comparison 2020-02-14 12:55:47 +00:00			`report_stage_end('preconditions')`

[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`# Process substitutions`
			`subst_elems = root.findall('substitutions/substitution')`

			`parameter_keys = [] # ['table', 'limit' ]`
			`parameter_value_arrays = [] # [['hits_100m', 'hits_10m'], ['1', '10']]`
			`parameter_combinations = [] # [{table: hits_100m, limit: 1}, ...]`
			`for se in subst_elems:`
			`parameter_keys.append(se.find('name').text)`
			`parameter_value_arrays.append([v.text for v in se.findall('values/value')])`
			`parameter_combinations = [dict(zip(parameter_keys, parameter_combination)) for parameter_combination in itertools.product(*parameter_value_arrays)]`

performance comparison 2020-02-21 19:58:52 +00:00			`# Take care to keep the order of queries -- sometimes we have DROP IF EXISTS`
			`# followed by CREATE in create queries section, so the order matters.`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`def substitute_parameters(query_templates, parameter_combinations):`
performance comparison 2020-02-21 19:58:52 +00:00			`return [template.format(**parameters) for template, parameters`
			`in itertools.product(query_templates, parameter_combinations)]`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00
performance comparison 2020-02-14 12:55:47 +00:00			`report_stage_end('substitute')`

[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`# Run drop queries, ignoring errors`
			`drop_query_templates = [q.text for q in root.findall('drop_query')]`
			`drop_queries = substitute_parameters(drop_query_templates, parameter_combinations)`
			`for c in connections:`
			`for q in drop_queries:`
			`try:`
			`c.execute(q)`
			`except:`
[wip] performance comparison test 2020-01-16 19:39:07 +00:00			`traceback.print_exc()`
			`pass`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00
			`# Run create queries`
			`create_query_templates = [q.text for q in root.findall('create_query')]`
			`create_queries = substitute_parameters(create_query_templates, parameter_combinations)`
			`for c in connections:`
			`for q in create_queries:`
			`c.execute(q)`

			`# Run fill queries`
			`fill_query_templates = [q.text for q in root.findall('fill_query')]`
			`fill_queries = substitute_parameters(fill_query_templates, parameter_combinations)`
			`for c in connections:`
			`for q in fill_queries:`
			`c.execute(q)`

performance comparison 2020-02-14 12:55:47 +00:00			`report_stage_end('fill')`

[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`# Run test queries`
[wip] performance comparison fixes 2019-12-26 21:33:10 +00:00			`def tsv_escape(s):`
			`return s.replace('\\', '\\\\').replace('\t', '\\t').replace('\n', '\\n').replace('\r','')`

[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`test_query_templates = [q.text for q in root.findall('query')]`
			`test_queries = substitute_parameters(test_query_templates, parameter_combinations)`

performance comparison 2020-02-14 12:55:47 +00:00			`report_stage_end('substitute2')`

[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`for q in test_queries:`
performance comparison 2020-02-11 20:00:53 +00:00			`# Prewarm: run once on both servers. Helps to bring the data into memory,`
performance comparison 2020-02-11 15:01:16 +00:00			`# precompile the queries, etc.`
performance comparison 2020-02-11 20:00:53 +00:00			`for conn_index, c in enumerate(connections):`
performance comparison 2020-02-20 16:28:21 +00:00			`res = c.execute(q, query_id = 'prewarm {} {}'.format(0, q))`
performance comparison 2020-02-11 20:00:53 +00:00			`print('prewarm\t' + tsv_escape(q) + '\t' + str(conn_index) + '\t' + str(c.last_query.elapsed))`
performance comparison 2020-02-11 15:01:16 +00:00
			`# Now, perform measured runs.`
[wip] performance comparison test 2020-01-16 19:39:07 +00:00			`# Track the time spent by the client to process this query, so that we can notice`
			`# out the queries that take long to process on the client side, e.g. by sending`
			`# excessive data.`
			`start_seconds = time.perf_counter()`
			`server_seconds = 0`
[wip] performance comparison 2020-01-21 18:15:25 +00:00			`for run in range(0, args.runs):`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`for conn_index, c in enumerate(connections):`
			`res = c.execute(q)`
[wip] performance comparison test 2020-01-16 19:39:07 +00:00			`print('query\t' + tsv_escape(q) + '\t' + str(run) + '\t' + str(conn_index) + '\t' + str(c.last_query.elapsed))`
			`server_seconds += c.last_query.elapsed`

			`client_seconds = time.perf_counter() - start_seconds`
			`print('client-time\t{}\t{}\t{}'.format(tsv_escape(q), client_seconds, server_seconds))`
[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00
performance comparison 2020-02-14 12:55:47 +00:00			`report_stage_end('benchmark')`

[wip] some experimental scripts for peformance comparison 2019-12-26 17:35:41 +00:00			`# Run drop queries`
			`drop_query_templates = [q.text for q in root.findall('drop_query')]`
			`drop_queries = substitute_parameters(drop_query_templates, parameter_combinations)`
			`for c in connections:`
			`for q in drop_queries:`
			`c.execute(q)`
performance comparison 2020-02-14 12:55:47 +00:00
			`report_stage_end('drop')`