ClickHouse/tests/integration/test_delayed_replica_failover/test.py

import pytest
import time
import os, sys

sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
import helpers

from helpers.cluster import ClickHouseCluster
from helpers.network import PartitionManager


cluster = ClickHouseCluster(__file__)

# Topology: 2 shards x 2 replicas. node_1_1 hosts the Distributed table and is the only
# instance that receives the remote_servers.xml config, so from its point of view shard 1
# has a local replica while shard 2 consists of remote replicas only.
node_1_1 = cluster.add_instance(
    'node_1_1', with_zookeeper=True, main_configs=['configs/remote_servers.xml'])
# Alias that makes the role of node_1_1 explicit in the test body.
instance_with_dist_table = node_1_1

# The remaining replicas need nothing but ZooKeeper; they are registered in the same
# order as before (node_1_2, node_2_1, node_2_2).
node_1_2, node_2_1, node_2_2 = (
    cluster.add_instance(instance_name, with_zookeeper=True)
    for instance_name in ('node_1_2', 'node_2_1', 'node_2_2')
)

@pytest.fixture(scope="module")
def started_cluster():
    """Module-scoped fixture: start the cluster, create the test tables, yield the cluster.

    A `replicated` ReplicatedMergeTree table is created on every node_<shard>_<replica>
    instance (replicas of one shard share the same ZooKeeper path), and a `distributed`
    table over `test_cluster` is created on node_1_1. The cluster is shut down when the
    module's tests are finished, or if any step of the setup raises.
    """
    # The leading newline and the indentation inside the DDL are part of the query text.
    replicated_ddl = '''
CREATE TABLE replicated (d Date, x UInt32) ENGINE =
    ReplicatedMergeTree('/clickhouse/tables/{shard}/replicated', '{instance}', d, d, 8192)'''
    distributed_ddl = (
        "CREATE TABLE distributed (d Date, x UInt32) ENGINE = "
        "Distributed('test_cluster', 'default', 'replicated')")

    try:
        cluster.start()

        # Same visiting order as two nested loops: (1, 1), (1, 2), (2, 1), (2, 2).
        shard_replica_pairs = [(shard_no, replica_no)
                               for shard_no in (1, 2)
                               for replica_no in (1, 2)]
        for shard_no, replica_no in shard_replica_pairs:
            instance_name = 'node_{}_{}'.format(shard_no, replica_no)
            replica_node = cluster.instances[instance_name]
            replica_node.query(
                replicated_ddl.format(shard=shard_no, instance=replica_node.name))

        node_1_1.query(distributed_ddl)

        yield cluster

    finally:
        # Always tear the cluster down, even when setup failed half-way.
        cluster.shutdown()


def test(started_cluster):
    """Check replica selection of a Distributed table when some replicas lag behind.

    Scenario, in order:

    1. Replication traffic (port 9009) is cut inside each shard and one row is inserted
       into the second replica of each shard, so the first replicas stay empty and
       accumulate delay.
    2. Without a delay limit, `in_order` balancing reads from the (empty) first replicas.
    3. With `max_replica_delay_for_distributed_queries=1` the delayed first replicas are
       skipped and the sum over both shards is 3 (also with `WITH TOTALS`).
    4. After the second replicas lose their ZooKeeper connections every replica is stale;
       the query must still be answered from the second replicas, also when
       `skip_unavailable_shards=1` is set, and must fail when
       `fallback_to_stale_replicas_for_distributed_queries=0`.
    5. Finally node_1_2 is made unreachable from node_1_1 on port 9000 and the query is
       expected to return 2.

    :param started_cluster: the module-scoped cluster fixture (used only for its
        setup/teardown side effects).
    """
    with PartitionManager() as pm:
        # Hinder replication between replicas of the same shard, but leave the possibility of distributed connection.
        pm.partition_instances(node_1_1, node_1_2, port=9009)
        pm.partition_instances(node_2_1, node_2_2, port=9009)

        node_1_2.query("INSERT INTO replicated VALUES ('2017-05-08', 1)")
        node_2_2.query("INSERT INTO replicated VALUES ('2017-05-08', 2)")

        time.sleep(1) # accrue replica delay

        # Sanity check: the inserted rows are visible only on the second replicas.
        assert node_1_1.query("SELECT sum(x) FROM replicated").strip() == '0'
        assert node_1_2.query("SELECT sum(x) FROM replicated").strip() == '1'
        assert node_2_1.query("SELECT sum(x) FROM replicated").strip() == '0'
        assert node_2_2.query("SELECT sum(x) FROM replicated").strip() == '2'

        # With in_order balancing first replicas are chosen.
        assert instance_with_dist_table.query(
            "SELECT count() FROM distributed SETTINGS load_balancing='in_order'").strip() == '0'

        # When we set max_replica_delay, first replicas must be excluded.
        assert instance_with_dist_table.query('''
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
''').strip() == '3'

        # Same query with WITH TOTALS: the totals row must report the same sum.
        assert instance_with_dist_table.query('''
SELECT sum(x) FROM distributed WITH TOTALS SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
''').strip() == '3\n\n3'

        pm.drop_instance_zk_connections(node_1_2)
        pm.drop_instance_zk_connections(node_2_2)

        time.sleep(4) # allow pings to zookeeper to timeout (must be greater than ZK session timeout).

        # At this point all replicas are stale, but the query must still go to second replicas which are the least stale ones.
        assert instance_with_dist_table.query('''
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
''').strip() == '3'

        # Regression for fallback_to_stale_replicas in conjunction with skip_unavailable_shards
        assert instance_with_dist_table.query('''
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    skip_unavailable_shards=1,
    max_replica_delay_for_distributed_queries=1
''').strip() == '3'

        # If we forbid stale replicas, the query must fail.
        with pytest.raises(Exception):
            # print() with a single argument behaves the same on Python 2 and Python 3;
            # the output only matters for diagnostics if the query unexpectedly succeeds.
            print(instance_with_dist_table.query('''
SELECT count() FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1,
    fallback_to_stale_replicas_for_distributed_queries=0
'''))

        # Now partition off the remote replica of the local shard and test that failover still works.
        pm.partition_instances(node_1_1, node_1_2, port=9000)

        # Expected 2: presumably shard 1 is now served by the stale, empty local replica
        # (contributing 0) while shard 2 is still read from node_2_2.
        assert instance_with_dist_table.query('''
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
''').strip() == '2'
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`import pytest`
			`import time`
Fix false IOError messages in integration tests log. [#CLICKHOUSE-2] 2017-08-14 11:49:30 +00:00			`import os, sys`

			`sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))`
			`import helpers`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
			`from helpers.cluster import ClickHouseCluster`
			`from helpers.network import PartitionManager`


			`cluster = ClickHouseCluster(__file__)`

add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`# Cluster with 2 shards of 2 replicas each. node_1_1 is the instance with Distributed table.`
			`# Thus we have a shard with a local replica and a shard with remote replicas.`
			`node_1_1 = instance_with_dist_table = cluster.add_instance(`
			`'node_1_1', with_zookeeper=True, main_configs=['configs/remote_servers.xml'])`
			`node_1_2 = cluster.add_instance('node_1_2', with_zookeeper=True)`
			`node_2_1 = cluster.add_instance('node_2_1', with_zookeeper=True)`
			`node_2_2 = cluster.add_instance('node_2_2', with_zookeeper=True)`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
			`@pytest.fixture(scope="module")`
			`def started_cluster():`
			`try:`
			`cluster.start()`

add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`for shard in (1, 2):`
			`for replica in (1, 2):`
			`node = cluster.instances['node_{}_{}'.format(shard, replica)]`
			`node.query('''`
			`CREATE TABLE replicated (d Date, x UInt32) ENGINE =`
			`ReplicatedMergeTree('/clickhouse/tables/{shard}/replicated', '{instance}', d, d, 8192)'''`
			`.format(shard=shard, instance=node.name))`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`node_1_1.query(`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`"CREATE TABLE distributed (d Date, x UInt32) ENGINE = "`
			`"Distributed('test_cluster', 'default', 'replicated')")`

			`yield cluster`

			`finally:`
			`cluster.shutdown()`


			`def test(started_cluster):`
			`with PartitionManager() as pm:`
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`# Hinder replication between replicas of the same shard, but leave the possibility of distributed connection.`
			`pm.partition_instances(node_1_1, node_1_2, port=9009)`
			`pm.partition_instances(node_2_1, node_2_2, port=9009)`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`node_1_2.query("INSERT INTO replicated VALUES ('2017-05-08', 1)")`
			`node_2_2.query("INSERT INTO replicated VALUES ('2017-05-08', 2)")`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
			`time.sleep(1) # accrue replica delay`

fix test to conform to the new GROUP BY behaviour on empty tables 2018-03-07 18:09:26 +00:00			`assert node_1_1.query("SELECT sum(x) FROM replicated").strip() == '0'`
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`assert node_1_2.query("SELECT sum(x) FROM replicated").strip() == '1'`
fix test to conform to the new GROUP BY behaviour on empty tables 2018-03-07 18:09:26 +00:00			`assert node_2_1.query("SELECT sum(x) FROM replicated").strip() == '0'`
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`assert node_2_2.query("SELECT sum(x) FROM replicated").strip() == '2'`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
use stale local replica if all remote replicas are unavailable [#CLICKHOUSE-3377] 2017-10-27 20:34:21 +00:00			`# With in_order balancing first replicas are chosen.`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`assert instance_with_dist_table.query(`
fix test to conform to the new GROUP BY behaviour on empty tables 2018-03-07 18:09:26 +00:00			`"SELECT count() FROM distributed SETTINGS load_balancing='in_order'").strip() == '0'`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`# When we set max_replica_delay, first replicas must be excluded.`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`assert instance_with_dist_table.query('''`
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`SELECT sum(x) FROM distributed SETTINGS`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`load_balancing='in_order',`
			`max_replica_delay_for_distributed_queries=1`
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`''').strip() == '3'`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
Update test. 2020-08-03 17:07:09 +00:00			`assert instance_with_dist_table.query('''`
			`SELECT sum(x) FROM distributed WITH TOTALS SETTINGS`
			`load_balancing='in_order',`
			`max_replica_delay_for_distributed_queries=1`
			`''').strip() == '3\n\n3'`

add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`pm.drop_instance_zk_connections(node_1_2)`
			`pm.drop_instance_zk_connections(node_2_2)`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
fix integration tests 2017-06-14 13:23:23 +00:00			`time.sleep(4) # allow pings to zookeeper to timeout (must be greater than ZK session timeout).`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`# At this point all replicas are stale, but the query must still go to second replicas which are the least stale ones.`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`assert instance_with_dist_table.query('''`
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`SELECT sum(x) FROM distributed SETTINGS`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`load_balancing='in_order',`
			`max_replica_delay_for_distributed_queries=1`
add test [#CLICKHOUSE-3151] 2017-08-01 17:36:00 +00:00			`''').strip() == '3'`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00
Cover fallback_to_stale_replicas in conjunction with skip_unavailable_shards 2020-04-21 22:45:51 +00:00			`# Regression for skip_unavailable_shards in conjunction with skip_unavailable_shards`
			`assert instance_with_dist_table.query('''`
			`SELECT sum(x) FROM distributed SETTINGS`
			`load_balancing='in_order',`
			`skip_unavailable_shards=1,`
			`max_replica_delay_for_distributed_queries=1`
			`''').strip() == '3'`

ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`# If we forbid stale replicas, the query must fail.`
			`with pytest.raises(Exception):`
Updated integration tests. Add integration test for DDL. [#CLICKHOUSE-5] 2017-05-30 11:49:17 +00:00			`print instance_with_dist_table.query('''`
ClickHouse integration tests. [#CLICKHOUSE-2821] 2017-05-19 18:54:05 +00:00			`SELECT count() FROM distributed SETTINGS`
			`load_balancing='in_order',`
			`max_replica_delay_for_distributed_queries=1,`
			`fallback_to_stale_replicas_for_distributed_queries=0`
			`''')`
use stale local replica if all remote replicas are unavailable [#CLICKHOUSE-3377] 2017-10-27 20:34:21 +00:00
			`# Now partition off the remote replica of the local shard and test that failover still works.`
			`pm.partition_instances(node_1_1, node_1_2, port=9000)`

			`assert instance_with_dist_table.query('''`
			`SELECT sum(x) FROM distributed SETTINGS`
			`load_balancing='in_order',`
			`max_replica_delay_for_distributed_queries=1`
			`''').strip() == '2'`