mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-12 17:32:32 +00:00
8ed5cfc265
* impl
* fix style
* make executeQueryWithParallelReplicas similar to executeQuery
* impl for parallel replicas
* cleaner code for remote sorting properties
* update test
* fix
* handle when nodes of old versions participate
* small fixes
* temporary enable for testing
* fix after merge
* Revert "temporary enable for testing"
This reverts commit cce7f8884c
.
* review fixes
* add bc test
* Update src/Core/Settings.h
73 lines
3.1 KiB
SQL
73 lines
3.1 KiB
SQL
-- Tags: no-parallel
|
|
|
|
create table t(a UInt64, b UInt64) engine=MergeTree order by a;
|
|
system stop merges t;
|
|
insert into t select number, number from numbers_mt(1e6);
|
|
|
|
set enable_memory_bound_merging_of_aggregation_results = 1;
|
|
set max_threads = 4;
|
|
set optimize_aggregation_in_order = 1;
|
|
set prefer_localhost_replica = 1;
|
|
|
|
-- slightly different transforms will be generated by reading steps if we let settings randomisation to change this setting value --
|
|
set read_in_order_two_level_merge_threshold = 1000;
|
|
|
|
create table dist_t as t engine = Distributed(test_cluster_two_shards, currentDatabase(), t, a % 2);
|
|
|
|
-- { echoOn } --
|
|
explain pipeline select a from remote(test_cluster_two_shards, currentDatabase(), t) group by a;
|
|
|
|
select a from remote(test_cluster_two_shards, currentDatabase(), t) group by a order by a limit 5 offset 100500;
|
|
|
|
explain pipeline select a from remote(test_cluster_two_shards, currentDatabase(), dist_t) group by a;
|
|
|
|
select a from remote(test_cluster_two_shards, currentDatabase(), dist_t) group by a order by a limit 5 offset 100500;
|
|
|
|
-- { echoOff } --
|
|
|
|
set aggregation_in_order_max_block_bytes = '1Mi';
|
|
set max_block_size = 500;
|
|
-- actual block size might be slightly bigger than the limit --
|
|
select max(bs) < 70000 from (select avg(a), max(blockSize()) as bs from remote(test_cluster_two_shards, currentDatabase(), t) group by a);
|
|
|
|
-- beautiful case when we have different sorting key definitions in tables involved in distributed query => different plans => different sorting properties of local aggregation results --
|
|
create database if not exists shard_1;
|
|
create table t_different_dbs(a UInt64, b UInt64) engine = MergeTree order by a;
|
|
create table shard_1.t_different_dbs(a UInt64, b UInt64) engine = MergeTree order by tuple();
|
|
|
|
insert into t_different_dbs select number % 1000, number % 1000 from numbers_mt(1e6);
|
|
insert into shard_1.t_different_dbs select number % 1000, number % 1000 from numbers_mt(1e6);
|
|
|
|
create table dist_t_different_dbs as t engine = Distributed(test_cluster_two_shards_different_databases_with_local, '', t_different_dbs);
|
|
|
|
-- { echoOn } --
|
|
explain pipeline select a, count() from dist_t_different_dbs group by a order by a limit 5 offset 500;
|
|
|
|
select a, count() from dist_t_different_dbs group by a order by a limit 5 offset 500;
|
|
select a, count() from dist_t_different_dbs group by a, b order by a limit 5 offset 500;
|
|
|
|
-- { echoOff } --
|
|
|
|
set allow_experimental_parallel_reading_from_replicas = 1;
|
|
set max_parallel_replicas = 3;
|
|
set use_hedged_requests = 0;
|
|
|
|
create table pr_t(a UInt64, b UInt64) engine=MergeTree order by a;
|
|
insert into pr_t select number % 1000, number % 1000 from numbers_mt(1e6);
|
|
create table dist_pr_t as pr_t engine = Distributed(test_cluster_one_shard_three_replicas_localhost, currentDatabase(), pr_t);
|
|
|
|
-- { echoOn } --
|
|
explain pipeline select a from dist_pr_t group by a order by a limit 5 offset 500;
|
|
|
|
select a, count() from dist_pr_t group by a order by a limit 5 offset 500;
|
|
select a, count() from dist_pr_t group by a, b order by a limit 5 offset 500;
|
|
|
|
-- { echoOff } --
|
|
|
|
drop table dist_pr_t;
|
|
drop table dist_t_different_dbs;
|
|
drop table shard_1.t_different_dbs;
|
|
drop table t_different_dbs;
|
|
drop table dist_t;
|
|
drop table t;
|