ClickHouse/tests/integration/test_delayed_replica_failover/test.py

import os
import sys
import time
import pytest
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from helpers.cluster import ClickHouseCluster
from helpers.network import PartitionManager
cluster = ClickHouseCluster(__file__)

# Cluster with 2 shards of 2 replicas each. node_1_1 is the instance with the Distributed table.
# Thus we have a shard with a local replica and a shard with remote replicas.
node_1_1 = instance_with_dist_table = cluster.add_instance(
    "node_1_1", with_zookeeper=True, main_configs=["configs/remote_servers.xml"]
)
node_1_2 = cluster.add_instance("node_1_2", with_zookeeper=True)
node_2_1 = cluster.add_instance("node_2_1", with_zookeeper=True)
node_2_2 = cluster.add_instance("node_2_2", with_zookeeper=True)

# For the test to be runnable multiple times.
seqno = 0


@pytest.fixture(scope="module")
def started_cluster():
    try:
        cluster.start()

        yield cluster
    finally:
        cluster.shutdown()


@pytest.fixture(scope="function", autouse=True)
def create_tables():
    global seqno
    try:
        seqno += 1

        for shard in (1, 2):
            for replica in (1, 2):
                node = cluster.instances["node_{}_{}".format(shard, replica)]
                node.query(
                    f"CREATE TABLE replicated (d Date, x UInt32) ENGINE = "
                    f"ReplicatedMergeTree('/clickhouse/tables/{shard}/replicated_{seqno}', '{node.name}') PARTITION BY toYYYYMM(d) ORDER BY d"
                )

        node_1_1.query(
            "CREATE TABLE distributed (d Date, x UInt32) ENGINE = "
            "Distributed('test_cluster', 'default', 'replicated')"
        )
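        # 'test_cluster' is presumably defined in configs/remote_servers.xml with the
        # 2 shards x 2 replicas layout described at the top of this file.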

        yield
    finally:
        node_1_1.query("DROP TABLE distributed")
        node_1_1.query("DROP TABLE replicated")
        node_1_2.query("DROP TABLE replicated")
        node_2_1.query("DROP TABLE replicated")
        node_2_2.query("DROP TABLE replicated")


def test(started_cluster):
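    # The replicated_merge_tree_all_replicas_stale failpoint (enabled later in this test)
    # presumably forces every replica to be treated as stale; make sure it starts disabled
    # so the first assertions observe real replication delay.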
    instance_with_dist_table.query(
        "SYSTEM DISABLE FAILPOINT replicated_merge_tree_all_replicas_stale"
    )

    with PartitionManager() as pm:
        # Hinder replication between replicas of the same shard, but leave distributed
        # query connections possible.
        pm.partition_instances(node_1_1, node_1_2, port=9009)
        pm.partition_instances(node_2_1, node_2_2, port=9009)
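        # Port 9009 is the interserver HTTP port used for fetching parts between replicas;
        # the native protocol port (9000) stays reachable, so Distributed queries still work.
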
        node_1_2.query("INSERT INTO replicated VALUES ('2017-05-08', 1)")
        node_2_2.query("INSERT INTO replicated VALUES ('2017-05-08', 2)")

        time.sleep(1)  # accrue replica delay

        assert node_1_1.query("SELECT sum(x) FROM replicated").strip() == "0"
        assert node_1_2.query("SELECT sum(x) FROM replicated").strip() == "1"
        assert node_2_1.query("SELECT sum(x) FROM replicated").strip() == "0"
        assert node_2_2.query("SELECT sum(x) FROM replicated").strip() == "2"
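        # Replication between replicas is blocked, so the first replica of each shard saw
        # nothing; only the second replicas hold the inserted rows (x=1 and x=2).
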
        # With in_order balancing first replicas are chosen.
        assert (
            instance_with_dist_table.query(
                "SELECT count() FROM distributed SETTINGS load_balancing='in_order'"
            ).strip()
            == "0"
        )
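        # The first replicas (node_1_1 and node_2_1) have not received the inserted rows,
        # hence count() == 0 above.
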
        # When we set max_replica_delay, first replicas must be excluded.
        assert (
            instance_with_dist_table.query(
                """
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
"""
            ).strip()
            == "3"
        )
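
        # WITH TOTALS appends a totals row after an empty separator line in the TSV
        # output, hence the expected '3\n\n3' below.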
        assert (
            instance_with_dist_table.query(
                """
SELECT sum(x) FROM distributed WITH TOTALS SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
"""
            ).strip()
            == "3\n\n3"
        )

        pm.drop_instance_zk_connections(node_1_2)
        pm.drop_instance_zk_connections(node_2_2)
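        # Losing the ZooKeeper session should make the second replicas go stale as well,
        # setting up the "all replicas stale" scenario checked below.
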
        # Allow pings to ZooKeeper to time out (the wait must be longer than the ZK session timeout).
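        # Poll until the query finally fails (break); if it keeps succeeding for all
        # 30 attempts, the for/else raises.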
        for _ in range(30):
            try:
                node_2_2.query(
                    "SELECT * FROM system.zookeeper where path = '/' SETTINGS insert_keeper_max_retries = 0"
                )
                time.sleep(0.5)
            except:
                break
        else:
            raise Exception("Connection with zookeeper was not lost")

        instance_with_dist_table.query(
            "SYSTEM ENABLE FAILPOINT replicated_merge_tree_all_replicas_stale"
        )
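        # With the failpoint enabled, presumably every replica now reports itself as stale
        # regardless of its measured delay.
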
        # At this point all replicas are stale, but the query must still go to the second
        # replicas, which are the least stale ones.
        assert (
            instance_with_dist_table.query(
                """
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
"""
            ).strip()
            == "3"
        )

        # Prefer fallback_to_stale_replicas over skip_unavailable_shards.
        assert (
            instance_with_dist_table.query(
                """
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    skip_unavailable_shards=1,
    max_replica_delay_for_distributed_queries=1
"""
            ).strip()
            == "3"
        )
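        # If the shards were instead treated as unavailable and skipped, the result above
        # would be incomplete; the stale replicas still serve the data.
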
        # If we forbid stale replicas, the query must fail. The failure may take a few
        # attempts to surface, hence the retry loop.
        for _ in range(20):
            try:
                instance_with_dist_table.query(
                    """
SELECT count() FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1,
    fallback_to_stale_replicas_for_distributed_queries=0
"""
                )
                time.sleep(0.5)
            except:
                break
        else:
            raise Exception("Didn't raise when stale replicas are not allowed")

        # Now partition off the remote replica of the local shard and test that failover still works.
        pm.partition_instances(node_1_1, node_1_2, port=9000)
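        # Shard 1 can now be reached only through the local stale replica (node_1_1), which
        # has no data, so only shard 2 (served by node_2_2) contributes to the sum.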
        assert (
            instance_with_dist_table.query(
                """
SELECT sum(x) FROM distributed SETTINGS
    load_balancing='in_order',
    max_replica_delay_for_distributed_queries=1
"""
            ).strip()
            == "2"
        )