ClickHouse/tests/integration/test_filesystem_layout/test.py
2024-09-27 10:19:49 +00:00

176 lines
4.9 KiB
Python

from pathlib import Path
import pytest
from helpers.cluster import ClickHouseCluster
cluster = ClickHouseCluster(__file__)
node = cluster.add_instance(
"node",
main_configs=[
"configs/config.d/storage_configuration.xml",
],
with_minio=True,
stay_alive=True,
)
@pytest.fixture(scope="module")
def started_cluster():
try:
cluster.start()
yield cluster
finally:
cluster.shutdown()
def test_file_path_escaping(started_cluster):
node.query(
"CREATE DATABASE IF NOT EXISTS test ENGINE = Ordinary",
settings={"allow_deprecated_database_ordinary": 1},
)
node.query(
"""
CREATE TABLE test.`T.a_b,l-e!` (`~Id` UInt32)
ENGINE = MergeTree() PARTITION BY `~Id` ORDER BY `~Id` SETTINGS min_bytes_for_wide_part = 0, replace_long_file_name_to_hash = 0;
"""
)
node.query("""INSERT INTO test.`T.a_b,l-e!` VALUES (1);""")
node.query("""ALTER TABLE test.`T.a_b,l-e!` FREEZE;""")
node.exec_in_container(
[
"bash",
"-c",
"test -f /var/lib/clickhouse/data/test/T%2Ea_b%2Cl%2De%21/1_1_1_0/%7EId.bin",
]
)
node.exec_in_container(
[
"bash",
"-c",
"test -f /var/lib/clickhouse/shadow/1/data/test/T%2Ea_b%2Cl%2De%21/1_1_1_0/%7EId.bin",
]
)
node.query("CREATE DATABASE IF NOT EXISTS `test 2` ENGINE = Atomic")
node.query(
"""
CREATE TABLE `test 2`.`T.a_b,l-e!` UUID '12345678-1000-4000-8000-000000000001' (`~Id` UInt32)
ENGINE = MergeTree() PARTITION BY `~Id` ORDER BY `~Id` SETTINGS min_bytes_for_wide_part = 0, replace_long_file_name_to_hash = 0;
"""
)
node.query("""INSERT INTO `test 2`.`T.a_b,l-e!` VALUES (1);""")
node.query("""ALTER TABLE `test 2`.`T.a_b,l-e!` FREEZE;""")
node.exec_in_container(
[
"bash",
"-c",
"test -f /var/lib/clickhouse/store/123/12345678-1000-4000-8000-000000000001/1_1_1_0/%7EId.bin",
]
)
# Check symlink
node.exec_in_container(
["bash", "-c", "test -L /var/lib/clickhouse/data/test%202/T%2Ea_b%2Cl%2De%21"]
)
node.exec_in_container(
[
"bash",
"-c",
"test -f /var/lib/clickhouse/data/test%202/T%2Ea_b%2Cl%2De%21/1_1_1_0/%7EId.bin",
]
)
node.exec_in_container(
[
"bash",
"-c",
"test -f /var/lib/clickhouse/shadow/2/store/123/12345678-1000-4000-8000-000000000001/1_1_1_0/%7EId.bin",
]
)
node.query("DROP TABLE test.`T.a_b,l-e!` SYNC")
node.query("DROP TABLE `test 2`.`T.a_b,l-e!` SYNC")
node.query("DROP DATABASE test")
node.query("DROP DATABASE `test 2`")
def test_data_directory_symlinks(started_cluster):
node.query("CREATE DATABASE IF NOT EXISTS test_symlinks ENGINE = Atomic")
node.query(
sql="""
CREATE TABLE test_symlinks.default UUID '87654321-1000-4000-8000-000000000001'
(Id UInt32)
ENGINE = MergeTree()
PARTITION BY Id
ORDER BY Id
""",
database="test_symlinks",
)
node.query(
"""
CREATE TABLE test_symlinks.s3 UUID '87654321-1000-4000-8000-000000000002'
(Id UInt32)
ENGINE = MergeTree()
PARTITION BY Id
ORDER BY Id
SETTINGS storage_policy = 's3'
"""
)
node.query(
"""
CREATE TABLE test_symlinks.jbod UUID '87654321-1000-4000-8000-000000000003'
(Id UInt32)
ENGINE = MergeTree()
PARTITION BY Id
ORDER BY Id
SETTINGS storage_policy = 'jbod'
"""
)
clickhouse_dir = Path("/var/lib/clickhouse/")
database_dir = clickhouse_dir / "data" / "test_symlinks"
default_symlink = database_dir / "default"
s3_symlink = database_dir / "s3"
jbod_symlink = database_dir / "jbod"
default_data = (
clickhouse_dir / "store" / "876" / "87654321-1000-4000-8000-000000000001"
)
s3_data = (
clickhouse_dir
/ "disks"
/ "s3"
/ "store"
/ "876"
/ "87654321-1000-4000-8000-000000000002"
)
jbod_data = Path("jbod1") / "store" / "876" / "87654321-1000-4000-8000-000000000003"
node.restart_clickhouse()
assert (
node.exec_in_container(["bash", "-c", f"ls -l {default_symlink}"])
.strip()
.endswith(f"{default_symlink} -> {default_data}")
)
assert (
node.exec_in_container(["bash", "-c", f"ls -l {s3_symlink}"])
.strip()
.endswith(f"{s3_symlink} -> {s3_data}")
)
assert (
node.exec_in_container(["bash", "-c", f"ls -l {jbod_symlink}"])
.strip()
.endswith(f"{jbod_symlink} -> /{jbod_data}")
)
node.query("DROP TABLE test_symlinks.default SYNC")
node.query("DROP TABLE test_symlinks.s3 SYNC")
node.query("DROP TABLE test_symlinks.jbod SYNC")
node.query("DROP DATABASE test_symlinks")