ClickHouse/tests/integration/test_compression_nested_columns/test.py

117 lines
3.3 KiB
Python
Raw Normal View History

2020-09-22 13:16:42 +00:00
import random
import string
import pytest
2024-09-27 10:19:39 +00:00
2020-09-22 13:16:42 +00:00
from helpers.cluster import ClickHouseCluster
# Two instances in one test cluster, both created with ZooKeeper enabled
# (the test below creates ReplicatedMergeTree tables on them).
cluster = ClickHouseCluster(__file__)
node1, node2 = (
    cluster.add_instance(instance_name, with_zookeeper=True)
    for instance_name in ("node1", "node2")
)
2020-09-22 13:16:42 +00:00
@pytest.fixture(scope="module")
def start_cluster():
    """Module-scoped fixture: start the cluster, yield it, always shut it down.

    The ``finally`` clause runs ``cluster.shutdown()`` both after the tests
    of the module finish and when ``cluster.start()`` itself raises.
    """
    try:
        cluster.start()
        yield cluster
    finally:
        cluster.shutdown()
2020-09-22 13:16:42 +00:00
def get_compression_codec_byte(node, table_name, part_name, filename):
    """Return the hex dump of one byte of a column's ``.bin`` file.

    The command is executed through ``bash -c`` inside the node's container
    and does the following:

    * ``tail -c +17`` starts output at byte 17 of the file, i.e. skips the
      first 16 bytes (presumably the compressed block checksum, so that the
      next byte is the codec method byte -- confirm against the ClickHouse
      compressed block format);
    * ``od -x -N 1`` hex-dumps exactly one byte of what remains;
    * ``head -n 1 | awk '{print $2}'`` keeps the second field of the first
      output line, which is the dumped value (e.g. ``0082``).

    Args:
        node: object exposing ``exec_in_container(argv)`` that returns the
            command output as a string.
        table_name: table directory name under
            ``/var/lib/clickhouse/data/default``.
        part_name: data part directory name, e.g. ``1_0_0_0``.
        filename: column file name without the ``.bin`` extension,
            e.g. ``column_ok.null``.

    Returns:
        The command output with surrounding whitespace stripped.
    """
    bin_path = "/var/lib/clickhouse/data/default/{}/{}/{}.bin".format(
        table_name, part_name, filename
    )
    # Doubled braces keep awk's `{print $2}` literal through str.format().
    cmd = "tail -c +17 {} | od -x -N 1 | head -n 1 | awk '{{print $2}}'".format(
        bin_path
    )
    return node.exec_in_container(["bash", "-c", cmd]).strip()
2020-09-22 13:16:42 +00:00
# Expected output of get_compression_codec_byte() for each codec name.
# The values are the strings printed by the `od -x -N 1` pipeline used there.
CODECS_MAPPING = {
    "NONE": "0002",
    "LZ4": "0082",
    "LZ4HC": "0082",  # not an error, same byte
    "ZSTD": "0090",
    "Multiple": "0091",
    "Delta": "0092",
    "T64": "0093",
}
2020-09-22 13:16:42 +00:00
def test_nested_compression_codec(start_cluster):
    """Check the codec byte of every column file on both replicas.

    Steps:
      1. Create the same ReplicatedMergeTree table on node1 and node2; the
         replica name is the node's index in the list. The table settings
         zero out the wide-part thresholds and disable hashing of long file
         names, so each column stream is read below from its own ``.bin``
         file under its plain name.
      2. Insert one row through node1 and wait for node2 to sync.
      3. Detach and re-attach the table on both nodes (presumably so the
         files are inspected after the server has reloaded the part from
         disk -- confirm).
      4. For each node, read the codec byte of each file of part
         ``1_0_0_0`` and compare it with the expected CODECS_MAPPING entry.
    """
    for i, node in enumerate([node1, node2]):
        node.query(
            """
            CREATE TABLE compression_table (
                key UInt64,
                column_ok Nullable(UInt64) CODEC(Delta, LZ4),
                column_array Array(Array(UInt64)) CODEC(T64, LZ4),
                column_bad LowCardinality(Int64) CODEC(Delta)
            ) ENGINE = ReplicatedMergeTree('/t', '{}') ORDER BY tuple() PARTITION BY key
            SETTINGS min_rows_for_wide_part = 0, min_bytes_for_wide_part = 0, replace_long_file_name_to_hash = 0;
            """.format(
                i
            ),
            settings={
                "allow_suspicious_codecs": "1",
                "allow_suspicious_low_cardinality_types": "1",
            },
        )

    node1.query("INSERT INTO compression_table VALUES (1, 1, [[77]], 32)")
    node2.query("SYSTEM SYNC REPLICA compression_table", timeout=5)

    node1.query("DETACH TABLE compression_table")
    node2.query("DETACH TABLE compression_table")
    node1.query("ATTACH TABLE compression_table")
    node2.query("ATTACH TABLE compression_table")

    # (file name without ".bin", key into CODECS_MAPPING)
    expected_codecs = (
        ("column_ok", "Multiple"),
        ("column_ok.null", "LZ4"),
        ("column_array", "Multiple"),
        ("column_array.size0", "LZ4"),
        ("column_array.size1", "LZ4"),
        ("column_bad.dict", "Delta"),
        ("column_bad", "NONE"),
    )

    # Every file is verified on every replica, using the loop variable
    # rather than a fixed node.
    for node in [node1, node2]:
        for filename, codec_name in expected_codecs:
            actual = get_compression_codec_byte(
                node, "compression_table", "1_0_0_0", filename
            )
            assert actual == CODECS_MAPPING[codec_name], (
                "unexpected codec byte for {}.bin: got {!r}, expected {} ({!r})".format(
                    filename, actual, codec_name, CODECS_MAPPING[codec_name]
                )
            )