ClickHouse/tests/integration/test_s3_zero_copy_replication/test.py

import logging
import time

import pytest
from helpers.cluster import ClickHouseCluster

# Configure the root logger at import time: accept INFO and above, and attach
# a stream handler so the messages logged by this module are actually emitted.
logging.getLogger().setLevel(logging.INFO)
logging.getLogger().addHandler(logging.StreamHandler())


@pytest.fixture(scope="module")
def cluster():
    """Start a two-instance ClickHouse cluster and yield it to the tests.

    Both instances ("node1" and "node2") load ``configs/config.d/s3.xml``, get
    a distinct ``replica`` macro and are created with MinIO and ZooKeeper
    enabled. The fixture is module-scoped; ``cluster.shutdown()`` is called
    when the fixture is torn down, and also if configuration or startup fails.
    """
    # Construct the cluster object outside ``try``: if the constructor itself
    # raises there is nothing to shut down, and touching the still-unbound
    # local in ``finally`` would stack an UnboundLocalError on the real error.
    cluster = ClickHouseCluster(__file__)
    try:
        cluster.add_instance("node1", main_configs=["configs/config.d/s3.xml"], macros={'replica': '1'},
                             with_minio=True,
                             with_zookeeper=True)
        cluster.add_instance("node2", main_configs=["configs/config.d/s3.xml"], macros={'replica': '2'},
                             with_minio=True,
                             with_zookeeper=True)
        logging.info("Starting cluster...")
        cluster.start()
        logging.info("Cluster started")

        yield cluster
    finally:
        cluster.shutdown()


def get_large_objects_count(cluster, size=100):
    """Count objects under the ``data/`` prefix whose size is at least ``size``.

    The listing is taken from ``cluster.minio_client`` for the bucket named by
    ``cluster.minio_bucket``; every listed entry whose ``size`` attribute is
    greater than or equal to ``size`` contributes one to the result.
    """
    listing = cluster.minio_client.list_objects(cluster.minio_bucket, 'data/')
    return sum(1 for entry in listing if entry.size >= size)


def wait_for_large_objects_count(cluster, expected, size=100, timeout=30):
    """Poll until ``get_large_objects_count(cluster, size)`` equals ``expected``.

    The count is re-checked up to ``timeout`` times with a one-second sleep
    after each mismatch. Returns as soon as a poll matches; once the attempts
    are used up, one final check is made and asserted.
    """
    attempts_left = timeout
    while attempts_left > 0 and get_large_objects_count(cluster, size) != expected:
        time.sleep(1)
        attempts_left -= 1

    # Attempts remaining means the loop stopped because the count matched.
    if attempts_left > 0:
        return

    assert get_large_objects_count(cluster, size) == expected


@pytest.mark.parametrize(
    "policy", ["s3"]
)
def test_s3_zero_copy_replication(cluster, policy):
    """Check that two replicas of a table on S3 share objects instead of copying them.

    Rows are inserted on each node in turn and must be readable from both.
    Along the way the number of 100+ byte objects in the bucket is checked:
    one per part (shared by both replicas), three right after the merge, and
    one again after the old parts are cleaned up.
    """
    node1 = cluster.instances["node1"]
    node2 = cluster.instances["node2"]

    # The first '{}' is filled with the literal text '{replica}', leaving the
    # macro in the query; the second is filled with the storage policy name.
    node1.query(
        """
        CREATE TABLE s3_test ON CLUSTER test_cluster (id UInt32, value String)
        ENGINE=ReplicatedMergeTree('/clickhouse/tables/s3_test', '{}')
        ORDER BY id
        SETTINGS storage_policy='{}'
        """
            .format('{replica}', policy)
    )

    node1.query("INSERT INTO s3_test VALUES (0,'data'),(1,'data')")
    # Wait for node2 to process its replication queue instead of relying on a
    # fixed sleep, which is a race on a slow machine.
    node2.query("SYSTEM SYNC REPLICA s3_test")
    assert node1.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data')"
    assert node2.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data')"

    # Based on version 20.x - should be only one file with size 100+ (checksums.txt), used by both nodes
    # Polled like the other object-count checks below rather than asserted once.
    wait_for_large_objects_count(cluster, 1)

    node2.query("INSERT INTO s3_test VALUES (2,'data'),(3,'data')")
    node1.query("SYSTEM SYNC REPLICA s3_test")
    assert node2.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data'),(2,'data'),(3,'data')"
    assert node1.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data'),(2,'data'),(3,'data')"

    # Based on version 20.x - two parts
    wait_for_large_objects_count(cluster, 2)

    node1.query("OPTIMIZE TABLE s3_test")

    # Based on version 20.x - after merge, two old parts and one merged
    wait_for_large_objects_count(cluster, 3)

    # Based on version 20.x - after cleanup - only one merged part
    wait_for_large_objects_count(cluster, 1, timeout=60)

    node1.query("DROP TABLE IF EXISTS s3_test NO DELAY")
    node2.query("DROP TABLE IF EXISTS s3_test NO DELAY")


def test_s3_zero_copy_on_hybrid_storage(cluster):
    """Check that moving a shared part to S3 on a second replica adds no S3 objects.

    A replicated table with the 'hybrid' storage policy receives one insert,
    which lands on the 'default' disk on both nodes. The partition is moved to
    disk 's31' on node1, the total object count is recorded, and the same move
    is then done on node2. The object count must stay the same and the data
    must still be readable from both nodes.
    """
    node1 = cluster.instances["node1"]
    node2 = cluster.instances["node2"]

    # '{}' is filled with the literal text '{replica}', leaving the macro in the query.
    node1.query(
        """
        CREATE TABLE hybrid_test ON CLUSTER test_cluster (id UInt32, value String)
        ENGINE=ReplicatedMergeTree('/clickhouse/tables/hybrid_test', '{}')
        ORDER BY id
        SETTINGS storage_policy='hybrid'
        """
            .format('{replica}')
    )

    node1.query("INSERT INTO hybrid_test VALUES (0,'data'),(1,'data')")

    # Wait for node2 to process its replication queue instead of relying on a
    # fixed sleep, which is a race on a slow machine.
    node2.query("SYSTEM SYNC REPLICA hybrid_test")

    assert node1.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"
    assert node2.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"

    assert node1.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','default')"
    assert node2.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','default')"

    node1.query("ALTER TABLE hybrid_test MOVE PARTITION ID 'all' TO DISK 's31'")

    assert node1.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','s31')"
    assert node2.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','default')"

    # Total objects in S3 (size threshold 0 counts every listed object)
    s3_objects = get_large_objects_count(cluster, 0)

    node2.query("ALTER TABLE hybrid_test MOVE PARTITION ID 'all' TO DISK 's31'")

    assert node1.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','s31')"
    assert node2.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','s31')"

    # Check that moving the partition on node2 created no new objects on S3
    wait_for_large_objects_count(cluster, s3_objects, size=0)

    assert node1.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"
    assert node2.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"

    node1.query("DROP TABLE IF EXISTS hybrid_test NO DELAY")
    node2.query("DROP TABLE IF EXISTS hybrid_test NO DELAY")
Zero copy replication over S3: base tests 2020-10-19 12:20:45 +00:00			`import logging`
			`import time`

			`import pytest`
			`from helpers.cluster import ClickHouseCluster`

			`logging.getLogger().setLevel(logging.INFO)`
			`logging.getLogger().addHandler(logging.StreamHandler())`


			`@pytest.fixture(scope="module")`
			`def cluster():`
			`try:`
			`cluster = ClickHouseCluster(__file__)`
			`cluster.add_instance("node1", main_configs=["configs/config.d/s3.xml"], macros={'replica': '1'},`
			`with_minio=True,`
			`with_zookeeper=True)`
			`cluster.add_instance("node2", main_configs=["configs/config.d/s3.xml"], macros={'replica': '2'},`
			`with_minio=True,`
			`with_zookeeper=True)`
			`logging.info("Starting cluster...")`
			`cluster.start()`
			`logging.info("Cluster started")`

			`yield cluster`
			`finally:`
			`cluster.shutdown()`


			`def get_large_objects_count(cluster, size=100):`
			`minio = cluster.minio_client`
			`counter = 0`
			`for obj in minio.list_objects(cluster.minio_bucket, 'data/'):`
			`if obj.size >= size:`
			`counter = counter + 1`
			`return counter`


Fix flapping tests test_s3_zero_copy_replication, test_s3_zero_copy_on_hybrid_storage 2021-04-16 10:23:38 +00:00			`def wait_for_large_objects_count(cluster, expected, size=100, timeout=30):`
			`while timeout > 0:`
			`if get_large_objects_count(cluster, size) == expected:`
			`return`
			`timeout -= 1`
			`time.sleep(1)`
			`assert get_large_objects_count(cluster, size) == expected`


Zero copy replication over S3: base tests 2020-10-19 12:20:45 +00:00			`@pytest.mark.parametrize(`
			`"policy", ["s3"]`
			`)`
			`def test_s3_zero_copy_replication(cluster, policy):`
			`node1 = cluster.instances["node1"]`
			`node2 = cluster.instances["node2"]`

			`node1.query(`
			`"""`
			`CREATE TABLE s3_test ON CLUSTER test_cluster (id UInt32, value String)`
			`ENGINE=ReplicatedMergeTree('/clickhouse/tables/s3_test', '{}')`
			`ORDER BY id`
			`SETTINGS storage_policy='{}'`
			`"""`
			`.format('{replica}', policy)`
			`)`

			`node1.query("INSERT INTO s3_test VALUES (0,'data'),(1,'data')")`
S3 zero copy replication: fix tests 2020-10-23 10:01:40 +00:00			`time.sleep(1)`
Zero copy replication over S3: base tests 2020-10-19 12:20:45 +00:00			`assert node1.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data')"`
			`assert node2.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data')"`

			`# Based on version 20.x - should be only one file with size 100+ (checksums.txt), used by both nodes`
			`assert get_large_objects_count(cluster) == 1`

			`node2.query("INSERT INTO s3_test VALUES (2,'data'),(3,'data')")`
S3 zero copy replication: fix tests 2020-10-23 10:01:40 +00:00			`time.sleep(1)`
Zero copy replication over S3: base tests 2020-10-19 12:20:45 +00:00			`assert node2.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data'),(2,'data'),(3,'data')"`
			`assert node1.query("SELECT * FROM s3_test order by id FORMAT Values") == "(0,'data'),(1,'data'),(2,'data'),(3,'data')"`

			`# Based on version 20.x - two parts`
Fix flapping tests test_s3_zero_copy_replication, test_s3_zero_copy_on_hybrid_storage 2021-04-16 10:23:38 +00:00			`wait_for_large_objects_count(cluster, 2)`
Zero copy replication over S3: base tests 2020-10-19 12:20:45 +00:00
			`node1.query("OPTIMIZE TABLE s3_test")`

			`# Based on version 20.x - after merge, two old parts and one merged`
Fix flapping tests test_s3_zero_copy_replication, test_s3_zero_copy_on_hybrid_storage 2021-04-16 10:23:38 +00:00			`wait_for_large_objects_count(cluster, 3)`
Zero copy replication over S3: base tests 2020-10-19 12:20:45 +00:00
			`# Based on version 20.x - after cleanup - only one merged part`
Fix flapping tests test_s3_zero_copy_replication, test_s3_zero_copy_on_hybrid_storage 2021-04-16 10:23:38 +00:00			`wait_for_large_objects_count(cluster, 1, timeout=60)`
Zero copy replication over S3: base tests 2020-10-19 12:20:45 +00:00
			`node1.query("DROP TABLE IF EXISTS s3_test NO DELAY")`
			`node2.query("DROP TABLE IF EXISTS s3_test NO DELAY")`

Fix S3 Zero-Copy replication for hybrid storage 2021-03-30 17:38:04 +00:00
			`def test_s3_zero_copy_on_hybrid_storage(cluster):`
			`node1 = cluster.instances["node1"]`
			`node2 = cluster.instances["node2"]`

			`node1.query(`
			`"""`
			`CREATE TABLE hybrid_test ON CLUSTER test_cluster (id UInt32, value String)`
Fix flapping test_s3_zero_copy_replication 2021-04-01 13:40:52 +00:00			`ENGINE=ReplicatedMergeTree('/clickhouse/tables/hybrid_test', '{}')`
Fix S3 Zero-Copy replication for hybrid storage 2021-03-30 17:38:04 +00:00			`ORDER BY id`
			`SETTINGS storage_policy='hybrid'`
			`"""`
			`.format('{replica}')`
			`)`

			`node1.query("INSERT INTO hybrid_test VALUES (0,'data'),(1,'data')")`

			`time.sleep(1)`

			`assert node1.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"`
			`assert node2.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"`

			`assert node1.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','default')"`
			`assert node2.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','default')"`

			`node1.query("ALTER TABLE hybrid_test MOVE PARTITION ID 'all' TO DISK 's31'")`

			`assert node1.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','s31')"`
			`assert node2.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','default')"`

			`# Total objects in S3`
			`s3_objects = get_large_objects_count(cluster, 0)`

			`node2.query("ALTER TABLE hybrid_test MOVE PARTITION ID 'all' TO DISK 's31'")`

			`assert node1.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','s31')"`
			`assert node2.query("SELECT partition_id,disk_name FROM system.parts WHERE table='hybrid_test' FORMAT Values") == "('all','s31')"`

			`# Check that after moving partition on node2 no new objects on s3`
Fix flapping tests test_s3_zero_copy_replication, test_s3_zero_copy_on_hybrid_storage 2021-04-16 10:23:38 +00:00			`wait_for_large_objects_count(cluster, s3_objects, size=0)`
Fix S3 Zero-Copy replication for hybrid storage 2021-03-30 17:38:04 +00:00
			`assert node1.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"`
			`assert node2.query("SELECT * FROM hybrid_test ORDER BY id FORMAT Values") == "(0,'data'),(1,'data')"`
Fix flapping test_s3_zero_copy_replication 2021-04-01 13:40:52 +00:00
			`node1.query("DROP TABLE IF EXISTS hybrid_test NO DELAY")`
			`node2.query("DROP TABLE IF EXISTS hybrid_test NO DELAY")`