import os.path import pytest import logging from helpers.cluster import ClickHouseCluster from helpers.test_tools import TSV cluster = ClickHouseCluster(__file__) instance = cluster.add_instance("node") path_to_data = "/var/lib/clickhouse/" @pytest.fixture(scope="module") def started_cluster(): try: cluster.start() instance.query( "CREATE DATABASE test ENGINE = Ordinary" ) # Different path in shadow/ with Atomic instance.query("DROP TABLE IF EXISTS test.tbl") instance.query( "CREATE TABLE test.tbl (p Date, k Int8) ENGINE = MergeTree PARTITION BY toYYYYMM(p) ORDER BY p" ) for i in range(1, 4): instance.query( "INSERT INTO test.tbl (p, k) VALUES(toDate({}), {})".format(i, i) ) for i in range(31, 34): instance.query( "INSERT INTO test.tbl (p, k) VALUES(toDate({}), {})".format(i, i) ) expected = TSV( "1970-01-02\t1\n1970-01-03\t2\n1970-01-04\t3\n1970-02-01\t31\n1970-02-02\t32\n1970-02-03\t33" ) res = instance.query("SELECT * FROM test.tbl ORDER BY p") assert TSV(res) == expected instance.query("ALTER TABLE test.tbl FREEZE") yield cluster finally: cluster.shutdown() def get_last_backup_path(instance, database, table): fp_increment = os.path.join(path_to_data, "shadow/increment.txt") increment = instance.exec_in_container(["cat", fp_increment]).strip() return os.path.join(path_to_data, "shadow", increment, "data", database, table) def copy_backup_to_detached(instance, database, src_table, dst_table): fp_backup = os.path.join(path_to_data, "shadow", "*", "data", database, src_table) fp_detached = os.path.join(path_to_data, "data", database, dst_table, "detached") logging.debug(f"copy from {fp_backup} to {fp_detached}") instance.exec_in_container(["bash", "-c", f"cp -r {fp_backup} -T {fp_detached}"]) def test_restore(started_cluster): instance.query("CREATE TABLE test.tbl1 AS test.tbl") copy_backup_to_detached(started_cluster.instances["node"], "test", "tbl", "tbl1") # The data_version of parts to be attached are larger than the newly created table's data_version. instance.query("ALTER TABLE test.tbl1 ATTACH PARTITION 197001") instance.query("ALTER TABLE test.tbl1 ATTACH PARTITION 197002") instance.query("SELECT sleep(2)") # Validate the attached parts are identical to the backup. expected = TSV( "1970-01-02\t1\n1970-01-03\t2\n1970-01-04\t3\n1970-02-01\t31\n1970-02-02\t32\n1970-02-03\t33" ) res = instance.query("SELECT * FROM test.tbl1 ORDER BY p") assert TSV(res) == expected instance.query("ALTER TABLE test.tbl1 UPDATE k=10 WHERE 1") instance.query("SELECT sleep(2)") # Validate mutation has been applied to all attached parts. expected = TSV( "1970-01-02\t10\n1970-01-03\t10\n1970-01-04\t10\n1970-02-01\t10\n1970-02-02\t10\n1970-02-03\t10" ) res = instance.query("SELECT * FROM test.tbl1 ORDER BY p") assert TSV(res) == expected instance.query("DROP TABLE IF EXISTS test.tbl1") def test_attach_partition(started_cluster): instance.query("CREATE TABLE test.tbl2 AS test.tbl") for i in range(3, 5): instance.query( "INSERT INTO test.tbl2(p, k) VALUES(toDate({}), {})".format(i, i) ) for i in range(33, 35): instance.query( "INSERT INTO test.tbl2(p, k) VALUES(toDate({}), {})".format(i, i) ) expected = TSV("1970-01-04\t3\n1970-01-05\t4\n1970-02-03\t33\n1970-02-04\t34") res = instance.query("SELECT * FROM test.tbl2 ORDER BY p") assert TSV(res) == expected copy_backup_to_detached(started_cluster.instances["node"], "test", "tbl", "tbl2") # The data_version of parts to be attached # - may be less than, equal to or larger than the current table's data_version. # - may intersect with the existing parts of a partition. instance.query("ALTER TABLE test.tbl2 ATTACH PARTITION 197001") instance.query("ALTER TABLE test.tbl2 ATTACH PARTITION 197002") instance.query("SELECT sleep(2)") expected = TSV( "1970-01-02\t1\n1970-01-03\t2\n1970-01-04\t3\n1970-01-04\t3\n1970-01-05\t4\n1970-02-01\t31\n1970-02-02\t32\n1970-02-03\t33\n1970-02-03\t33\n1970-02-04\t34" ) res = instance.query("SELECT * FROM test.tbl2 ORDER BY p") assert TSV(res) == expected instance.query("ALTER TABLE test.tbl2 UPDATE k=10 WHERE 1") instance.query("SELECT sleep(2)") # Validate mutation has been applied to all attached parts. expected = TSV( "1970-01-02\t10\n1970-01-03\t10\n1970-01-04\t10\n1970-01-04\t10\n1970-01-05\t10\n1970-02-01\t10\n1970-02-02\t10\n1970-02-03\t10\n1970-02-03\t10\n1970-02-04\t10" ) res = instance.query("SELECT * FROM test.tbl2 ORDER BY p") assert TSV(res) == expected instance.query("DROP TABLE IF EXISTS test.tbl2") def test_replace_partition(started_cluster): instance.query("CREATE TABLE test.tbl3 AS test.tbl") for i in range(3, 5): instance.query( "INSERT INTO test.tbl3(p, k) VALUES(toDate({}), {})".format(i, i) ) for i in range(33, 35): instance.query( "INSERT INTO test.tbl3(p, k) VALUES(toDate({}), {})".format(i, i) ) expected = TSV("1970-01-04\t3\n1970-01-05\t4\n1970-02-03\t33\n1970-02-04\t34") res = instance.query("SELECT * FROM test.tbl3 ORDER BY p") assert TSV(res) == expected copy_backup_to_detached(started_cluster.instances["node"], "test", "tbl", "tbl3") # The data_version of parts to be copied # - may be less than, equal to or larger than the current table data_version. # - may intersect with the existing parts of a partition. instance.query("ALTER TABLE test.tbl3 REPLACE PARTITION 197002 FROM test.tbl") instance.query("SELECT sleep(2)") expected = TSV( "1970-01-04\t3\n1970-01-05\t4\n1970-02-01\t31\n1970-02-02\t32\n1970-02-03\t33" ) res = instance.query("SELECT * FROM test.tbl3 ORDER BY p") assert TSV(res) == expected instance.query("ALTER TABLE test.tbl3 UPDATE k=10 WHERE 1") instance.query("SELECT sleep(2)") # Validate mutation has been applied to all copied parts. expected = TSV( "1970-01-04\t10\n1970-01-05\t10\n1970-02-01\t10\n1970-02-02\t10\n1970-02-03\t10" ) res = instance.query("SELECT * FROM test.tbl3 ORDER BY p") assert TSV(res) == expected instance.query("DROP TABLE IF EXISTS test.tbl3") def test_freeze_in_memory(started_cluster): instance.query( "CREATE TABLE test.t_in_memory(a UInt32, s String) ENGINE = MergeTree ORDER BY a SETTINGS min_rows_for_compact_part = 1000" ) instance.query("INSERT INTO test.t_in_memory VALUES (1, 'a')") instance.query("ALTER TABLE test.t_in_memory FREEZE") fp_backup = get_last_backup_path( started_cluster.instances["node"], "test", "t_in_memory" ) part_path = fp_backup + "/all_1_1_0/" assert TSV( instance.query( "SELECT part_type, is_frozen FROM system.parts WHERE database = 'test' AND table = 't_in_memory'" ) ) == TSV("InMemory\t1\n") instance.exec_in_container(["test", "-f", part_path + "/data.bin"]) assert instance.exec_in_container(["cat", part_path + "/count.txt"]).strip() == "1" instance.query( "CREATE TABLE test.t_in_memory_2(a UInt32, s String) ENGINE = MergeTree ORDER BY a" ) copy_backup_to_detached( started_cluster.instances["node"], "test", "t_in_memory", "t_in_memory_2" ) instance.query("ALTER TABLE test.t_in_memory_2 ATTACH PARTITION ID 'all'") assert TSV( instance.query( "SELECT part_type FROM system.parts WHERE database = 'test' AND table = 't_in_memory_2'" ) ) == TSV("Compact\n") assert TSV(instance.query("SELECT a, s FROM test.t_in_memory_2")) == TSV("1\ta\n")