ClickHouse/tests/integration/test_keeper_three_nodes_two_alive/test.py
2024-09-27 10:19:49 +00:00

169 lines
4.3 KiB
Python

#!/usr/bin/env python3
import os
import random
import string
import time
from multiprocessing.dummy import Pool
import pytest
from kazoo.client import KazooClient, KazooState
import helpers.keeper_utils as keeper_utils
from helpers.cluster import ClickHouseCluster
from helpers.test_tools import assert_eq_with_retry
# Cluster shared by every test in this module.
cluster = ClickHouseCluster(__file__)

# (instance name, per-node Keeper config), listed in registration order.
_KEEPER_NODES = (
    ("node1", "configs/enable_keeper1.xml"),
    ("node2", "configs/enable_keeper2.xml"),
    ("node3", "configs/enable_keeper3.xml"),
)

# Each instance gets its own enable_keeperN.xml plus the common
# keeper_conf.xml. stay_alive=True is passed for all of them; the tests below
# call stop_clickhouse()/start_clickhouse() on these instances.
node1, node2, node3 = [
    cluster.add_instance(
        instance_name,
        main_configs=[enable_config, "configs/keeper_conf.xml"],
        stay_alive=True,
    )
    for instance_name, enable_config in _KEEPER_NODES
]
def get_fake_zk(nodename, timeout=30.0):
    """Return a started KazooClient pointed at port 9181 of ``nodename``.

    The host address is taken from ``cluster.get_instance_ip(nodename)``.
    ``timeout`` is forwarded to the ``KazooClient`` constructor.

    The client is returned already started; this function never stops it, so
    the caller is expected to call ``stop()`` and ``close()`` when done.
    """
    keeper_address = cluster.get_instance_ip(nodename) + ":9181"
    client = KazooClient(hosts=keeper_address, timeout=timeout)
    client.start()
    return client
@pytest.fixture(scope="module")
def started_cluster():
    """Module-scoped fixture: start the cluster, yield it, then shut it down."""
    try:
        # start() is inside the try so that shutdown() also runs when startup
        # itself raises.
        cluster.start()
        yield cluster
    finally:
        cluster.shutdown()
def start(node):
    """Start ClickHouse on ``node``, then wait via keeper_utils until connected.

    Takes a single argument so it can be used directly as the worker function
    for ``Pool.map`` in the tests below.
    """
    node.start_clickhouse()
    keeper_utils.wait_until_connected(cluster, node)
def delete_with_retry(node_name, path):
    """Delete ``path`` through ``node_name``, retrying on any failure.

    Makes up to 30 attempts. Each attempt opens a fresh client with
    ``get_fake_zk`` and always stops/closes it afterwards. A failed attempt is
    followed by a 0.5 second sleep.

    Args:
        node_name: Name of the cluster instance to connect to.
        path: Keeper path to delete.

    Raises:
        Exception: If none of the attempts succeeded.
    """
    for _ in range(30):
        zk = None
        try:
            zk = get_fake_zk(node_name)
            zk.delete(path)
            return
        except Exception:
            # Deliberate best effort: any error (connect or delete) just
            # triggers another attempt. ``Exception`` rather than a bare
            # ``except`` so KeyboardInterrupt/SystemExit still propagate.
            time.sleep(0.5)
        finally:
            # get_fake_zk() may have raised before ``zk`` was bound. Without
            # this guard the AttributeError from ``None.stop()`` would escape
            # the ``finally`` and abort the retry loop on the first failure.
            if zk is not None:
                zk.stop()
                zk.close()

    raise Exception(f"Cannot delete {path} from node {node_name}")
def test_start_offline(started_cluster):
    """Start node2 and node3 together while node1 stays stopped.

    Steps:
      1. Create "/test_alive" through node1.
      2. Stop all three nodes, sleep 3 seconds, then start node2 and node3
         in parallel.
      3. Assert both logged "Cannot connect to ZooKeeper (or Keeper) before
         internal Keeper start".
      4. Check that node2 accepts a write ("/c").

    Cleanup always starts all three nodes again and deletes "/test_alive".
    """
    p = Pool(3)
    # Bound before the try block so cleanup never hits an unbound name when a
    # connection attempt fails.
    node1_zk = None
    node2_zk = None
    try:
        node1_zk = get_fake_zk("node1")
        node1_zk.create("/test_alive", b"aaaa")

        node1.stop_clickhouse()
        node2.stop_clickhouse()
        node3.stop_clickhouse()

        time.sleep(3)
        p.map(start, [node2, node3])

        assert node2.contains_in_log(
            "Cannot connect to ZooKeeper (or Keeper) before internal Keeper start"
        )
        assert node3.contains_in_log(
            "Cannot connect to ZooKeeper (or Keeper) before internal Keeper start"
        )

        node2_zk = get_fake_zk("node2")
        node2_zk.create("/c", b"data")
    finally:
        try:
            p.map(start, [node1, node2, node3])
            delete_with_retry("node1", "/test_alive")
        finally:
            # Release every client that was actually opened, even if the
            # restart or the delete above raised.
            for zk in (node1_zk, node2_zk):
                if zk is not None:
                    zk.stop()
                    zk.close()
            # All map() calls have returned, so the workers are idle.
            p.close()
            p.join()
def test_start_non_existing(started_cluster):
    """Start node1 and node2 with "node3" replaced by a non-existing host.

    Steps:
      1. Stop all three nodes.
      2. Replace "node3" with "non_existing_node" in the enable_keeper
         configs of node1 and node2.
      3. Sleep 3 seconds, then start node2 and node1 in parallel.
      4. Assert both logged "Cannot connect to ZooKeeper (or Keeper) before
         internal Keeper start".
      5. Check that node2 accepts a write ("/test_non_exising").

    Cleanup always restores the configs, starts all three nodes and deletes
    the created path.
    """
    p = Pool(3)
    node2_zk = None
    try:
        node1.stop_clickhouse()
        node2.stop_clickhouse()
        node3.stop_clickhouse()

        node1.replace_in_config(
            "/etc/clickhouse-server/config.d/enable_keeper1.xml",
            "node3",
            "non_existing_node",
        )
        node2.replace_in_config(
            "/etc/clickhouse-server/config.d/enable_keeper2.xml",
            "node3",
            "non_existing_node",
        )

        time.sleep(3)
        p.map(start, [node2, node1])

        assert node1.contains_in_log(
            "Cannot connect to ZooKeeper (or Keeper) before internal Keeper start"
        )
        assert node2.contains_in_log(
            "Cannot connect to ZooKeeper (or Keeper) before internal Keeper start"
        )

        node2_zk = get_fake_zk("node2")
        node2_zk.create("/test_non_exising", b"data")
    finally:
        try:
            # Undo the config substitution before bringing everything back.
            node1.replace_in_config(
                "/etc/clickhouse-server/config.d/enable_keeper1.xml",
                "non_existing_node",
                "node3",
            )
            node2.replace_in_config(
                "/etc/clickhouse-server/config.d/enable_keeper2.xml",
                "non_existing_node",
                "node3",
            )
            p.map(start, [node1, node2, node3])
            delete_with_retry("node2", "/test_non_exising")
        finally:
            # Release the client and the pool even if the restore, the
            # restart or the delete above raised.
            if node2_zk is not None:
                node2_zk.stop()
                node2_zk.close()
            # All map() calls have returned, so the workers are idle.
            p.close()
            p.join()
def test_restart_third_node(started_cluster):
    """Restart node3 while node1 and node2 are left running.

    Creates "/test_restart" through node1, restarts node3, waits for it via
    keeper_utils and asserts it logged "Connected to ZooKeeper (or Keeper)
    before internal Keeper start". The path is deleted again on success.
    """
    # Bound before the try block so the cleanup below never hits an unbound
    # name (and masks the real error) when the initial connection fails.
    node1_zk = None
    try:
        node1_zk = get_fake_zk("node1")
        node1_zk.create("/test_restart", b"aaaa")

        node3.restart_clickhouse()
        keeper_utils.wait_until_connected(cluster, node3)

        assert node3.contains_in_log(
            "Connected to ZooKeeper (or Keeper) before internal Keeper start"
        )
        node1_zk.delete("/test_restart")
    finally:
        if node1_zk is not None:
            node1_zk.stop()
            node1_zk.close()