2017-07-17 15:36:27 +00:00
<test >
2017-07-17 18:01:47 +00:00
<name > test_hits</name>
<type > loop</type>
2017-07-17 15:36:27 +00:00
<!-- Stop criteria for the test loop.
     NOTE(review): judging by the element names, the run presumably ends once every
     condition inside all_of holds, or as soon as any single condition inside any_of
     holds; confirm against the performance-test runner. -->
<stop_conditions >
2017-07-17 18:01:47 +00:00
<all_of >
2017-07-18 20:41:24 +00:00
<iterations > 3</iterations>
2017-07-17 18:01:47 +00:00
<!-- The _ms suffix suggests milliseconds, i.e. 10000 = 10 seconds (TODO confirm). -->
<min_time_not_changing_for_ms > 10000</min_time_not_changing_for_ms>
</all_of>
2017-07-17 15:36:27 +00:00
<any_of >
2017-07-18 20:41:24 +00:00
<iterations > 5</iterations>
2017-07-17 18:01:47 +00:00
<!-- The _ms suffix suggests milliseconds, i.e. 60000 = 60 seconds (TODO confirm). -->
<total_time_ms > 60000</total_time_ms>
2017-07-17 15:36:27 +00:00
</any_of>
</stop_conditions>
2017-07-17 18:01:47 +00:00
<!-- Selects min_time as the main metric of this test.
     NOTE(review): presumably the minimum query time observed across iterations; confirm. -->
<main_metric >
<min_time />
</main_metric>
2017-07-17 15:36:27 +00:00
<!-- Requirements for running the test: every query below reads from test.hits.
     NOTE(review): presumably the runner does not run the test when the table is absent; confirm. -->
<preconditions >
<table_exists > test.hits</table_exists>
</preconditions>
2017-07-17 18:01:47 +00:00
<!-- 14. Некриптографическая хэш-функция для строк небольшой длины.
2017-07-17 15:36:27 +00:00
В качестве данных в следующих тестах будут использованы поисковые фразы (SearchPhrase), URL и PageCharset.
Строка SearchPhrase непустая только в 6.8% случаев. Средняя длина непустой строки - 47 байт.
URL почти всегда непуст и его средняя длина - 77 байт.
PageCharset тоже почти всегда непуст, но его средняя длина поменьше - 6.2 байта. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(cityHash64(SearchPhrase)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(cityHash64(SearchPhrase))</query>
2017-07-17 15:36:27 +00:00
<!-- 15. Некриптографическая хэш-функция для строк небольшой длины. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(farmHash64(SearchPhrase)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(farmHash64(SearchPhrase))</query>
2017-07-17 15:36:27 +00:00
<!-- 16. Некриптографическая хэш-функция для строк небольшой длины. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(metroHash64(SearchPhrase)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(metroHash64(SearchPhrase))</query>
2017-07-17 15:36:27 +00:00
<!-- 17. Криптографическая хэш-функция для строк. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(sipHash64(SearchPhrase)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(sipHash64(SearchPhrase))</query>
2017-07-17 15:36:27 +00:00
<!-- 18. Криптографическая хэш-функция для строк. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(MD5(SearchPhrase)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(MD5(SearchPhrase))</query>
2017-07-17 15:36:27 +00:00
<!-- 19. Криптографическая хэш-функция для строк. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(MD5(URL)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(MD5(URL))</query>
2017-07-17 15:36:27 +00:00
<!-- 20. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(cityHash64(URL)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(cityHash64(URL))</query>
2017-07-17 15:36:27 +00:00
<!-- 21. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(sipHash64(URL)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(sipHash64(URL))</query>
2017-07-17 15:36:27 +00:00
<!-- 22. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(cityHash64(PageCharset)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(cityHash64(PageCharset))</query>
2017-07-17 15:36:27 +00:00
<!-- 23. Поиск подстроки в строке. -->
<query > SELECT count() FROM test.hits WHERE URL LIKE '%metrika%' SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE URL LIKE '%metrika%'</query>
2017-07-17 15:36:27 +00:00
<!-- 24. Более сложный поиск подстроки в строке. -->
<query > SELECT count() FROM test.hits WHERE positionCaseInsensitiveUTF8(URL, 'новости') != 0 SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE positionCaseInsensitiveUTF8(URL, 'новости') != 0</query>
2017-07-17 15:36:27 +00:00
<!-- 25. Регексп. -->
<query > SELECT count() FROM test.hits WHERE match(URL, '^https?://(?:www\\.)?metri[kc]a\\.yandex\\.(?:ru|com|com\\.tr|ua|by|kz)/.+?2014') SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE match(URL, '^https?://(?:www\\.)?metri[kc]a\\.yandex\\.(?:ru|com|com\\.tr|ua|by|kz)/.+?2014')</query>
2017-07-17 15:36:27 +00:00
<!-- 34. Сложная агрегация. -->
<query > SELECT SearchEngineID, SearchPhrase, RegionID FROM test.hits GROUP BY SearchEngineID, SearchPhrase, RegionID ORDER BY count() DESC LIMIT 10 SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT SearchEngineID, SearchPhrase, RegionID FROM test.hits GROUP BY SearchEngineID, SearchPhrase, RegionID ORDER BY count() DESC LIMIT 10</query>
2017-07-17 15:36:27 +00:00
<!-- 36. Функция для работы с датой и временем. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(toMonday(EventTime)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(toMonday(EventTime))</query>
2017-07-17 15:36:27 +00:00
<!-- 37. Функция для работы с URL. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(cutQueryString(URL)) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(cutQueryString(URL))</query>
2017-07-17 15:36:27 +00:00
<!-- 38. Разные алгоритмы вычисления квантилей. -->
<query > SELECT quantilesIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT quantilesIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits</query>
2017-07-17 15:36:27 +00:00
<!-- 39. Разные алгоритмы вычисления квантилей. -->
<query > SELECT quantilesTimingIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT quantilesTimingIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits</query>
2017-07-17 15:36:27 +00:00
<!-- 40. Разные алгоритмы вычисления квантилей. -->
<query > SELECT quantilesExactIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT quantilesExactIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits</query>
2017-07-17 15:36:27 +00:00
<!-- 41. Разные алгоритмы вычисления квантилей. -->
<query > SELECT quantilesTDigestIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT quantilesTDigestIf(0.5, 0.9)(SendTiming, SendTiming > 0) FROM test.hits</query>
2017-07-17 15:36:27 +00:00
<!-- 42. Разные алгоритмы вычисления кардинальности. -->
<query > SELECT uniq(UserID) FROM test.hits SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT uniq(UserID) FROM test.hits</query>
2017-07-17 15:36:27 +00:00
<!-- 43. Разные алгоритмы вычисления кардинальности. -->
<query > SELECT uniqCombined(UserID) FROM test.hits SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT uniqCombined(UserID) FROM test.hits</query>
2017-07-17 15:36:27 +00:00
<!-- 44. Разные алгоритмы вычисления кардинальности. -->
<query > SELECT uniqExact(UserID) FROM test.hits SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT uniqExact(UserID) FROM test.hits</query>
2017-07-17 15:36:27 +00:00
<!-- 45. Что-то чуть более похожее на реальный запрос. -->
<query > SELECT RegionID, uniq(UserID) FROM test.hits GROUP BY RegionID SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT RegionID, uniq(UserID) FROM test.hits GROUP BY RegionID</query>
2017-07-17 15:36:27 +00:00
<!-- 47. Читаем и разжимаем все столбцы, и ничего с ними потом не делаем. -->
<query > SELECT count() FROM test.hits WHERE NOT ignore(*) SETTINGS max_threads = 1</query>
2017-07-18 20:41:24 +00:00
<query > SELECT count() FROM test.hits WHERE NOT ignore(*)</query>
2017-07-17 15:36:27 +00:00
</test>