ClickHouse/tests/queries/0_stateless/03241_orc_dictionary_encode.sql
2024-10-15 16:10:13 +08:00

39 lines
2.6 KiB
SQL

-- Tags: no-fasttest
set input_format_orc_use_fast_decoder = 1;
set input_format_orc_dictionary_as_low_cardinality = 1;
insert into function file(concat(currentDatabase(), '_03241_data1_without_dict.orc'))
select toLowCardinality(cast(if (number % 10 = 0, null, number % 10) as Nullable(String))) as c from numbers(100000)
settings output_format_orc_dictionary_key_size_threshold = 0, engine_file_truncate_on_insert = 1;
insert into function file(concat(currentDatabase(), '_03241_data1_with_dict.orc'))
select toLowCardinality(cast(if (number % 10 = 0, null, number % 10) as Nullable(String))) as c from numbers(100000)
settings output_format_orc_dictionary_key_size_threshold = 0.1, engine_file_truncate_on_insert = 1;
desc file(concat(currentDatabase(), '_03241_data1_without_dict.orc'));
desc file(concat(currentDatabase(), '_03241_data1_with_dict.orc'));
select c, count(1) from file(concat(currentDatabase(), '_03241_data1_without_dict.orc')) group by c order by c;
select c, count(1) from file(concat(currentDatabase(), '_03241_data1_with_dict.orc')) group by c order by c;
select c, count(1) from file(concat(currentDatabase(), '_03241_data1_without_dict.orc'), ORC, 'c String') group by c order by c;
select c, count(1) from file(concat(currentDatabase(), '_03241_data1_with_dict.orc'), ORC, 'c LowCardinality(String)') group by c order by c;
set input_format_orc_dictionary_as_low_cardinality = 0;
insert into function file(concat(currentDatabase(), '_03241_data2_without_dict.orc'))
select toLowCardinality(cast(if (number % 10 = 0, null, number % 10) as Nullable(String))) as c from numbers(100000)
settings output_format_orc_dictionary_key_size_threshold = 0, engine_file_truncate_on_insert = 1;
insert into function file(concat(currentDatabase(), '_03241_data2_with_dict.orc'))
select toLowCardinality(cast(if (number % 10 = 0, null, number % 10) as Nullable(String))) as c from numbers(100000)
settings output_format_orc_dictionary_key_size_threshold = 0.1, engine_file_truncate_on_insert = 1;
desc file(concat(currentDatabase(), '_03241_data2_without_dict.orc'));
desc file(concat(currentDatabase(), '_03241_data2_with_dict.orc'));
select c, count(1) from file(concat(currentDatabase(), '_03241_data2_without_dict.orc')) group by c order by c;
select c, count(1) from file(concat(currentDatabase(), '_03241_data2_with_dict.orc')) group by c order by c;
select c, count(1) from file(concat(currentDatabase(), '_03241_data2_without_dict.orc'), ORC, 'c String') group by c order by c;
select c, count(1) from file(concat(currentDatabase(), '_03241_data2_with_dict.orc'), ORC, 'c LowCardinality(String)') group by c order by c;