Merge branch 'fix-unit-tests' into better-diagnostics-in-functional-tests

2024-09-19 16:20:50 +00:00 · 2024-07-26 04:51:46 +02:00 · 2024-07-26 04:51:46 +02:00 · 8f91fa8b78
commit 8f91fa8b78
parent 782d829d87 d6fdf29679
25 changed files with 87 additions and 716 deletions
--- a/docker/test/fuzzer/query-fuzzer-tweaks-users.xml
+++ b/docker/test/fuzzer/query-fuzzer-tweaks-users.xml
@ -20,7 +20,7 @@
                </max_execution_time>

                <max_memory_usage>
-                    <max>10G</max>
+                    <max>5G</max>
                </max_memory_usage>

                <table_function_remote_max_addresses>
--- a/docker/test/fuzzer/run-fuzzer.sh
+++ b/docker/test/fuzzer/run-fuzzer.sh
@ -208,7 +208,6 @@ handle SIGPIPE nostop noprint pass
 handle SIGTERM nostop noprint pass
 handle SIGUSR1 nostop noprint pass
 handle SIGUSR2 nostop noprint pass
-handle SIGSEGV nostop pass
 handle SIG$RTMIN nostop noprint pass
 info signals
 continue
--- a/docker/test/stateless/attach_gdb.lib
+++ b/docker/test/stateless/attach_gdb.lib
@ -20,7 +20,6 @@ handle SIGPIPE nostop noprint pass
 handle SIGTERM nostop noprint pass
 handle SIGUSR1 nostop noprint pass
 handle SIGUSR2 nostop noprint pass
-handle SIGSEGV nostop pass
 handle SIG$RTMIN nostop noprint pass
 info signals
 continue
--- a/src/Common/QueryProfiler.cpp
+++ b/src/Common/QueryProfiler.cpp
@ -33,7 +33,7 @@ namespace DB
 namespace
 {
 #if defined(OS_LINUX)
-    //thread_local size_t write_trace_iteration = 0;
+    thread_local size_t write_trace_iteration = 0;
 #endif
    /// Even after timer_delete() the signal can be delivered,
    /// since it does not do anything with pending signals.
@ -57,7 +57,7 @@ namespace

        auto saved_errno = errno;   /// We must restore previous value of errno in signal handler.

-#if defined(OS_LINUX) && false //asdqwe
+#if defined(OS_LINUX)
        if (info)
        {
            int overrun_count = info->si_overrun;
@ -92,7 +92,7 @@ namespace
        constexpr bool sanitizer = false;
 #endif

-        //asdqwe asynchronous_stack_unwinding = true;
+        asynchronous_stack_unwinding = true;
        if (sanitizer || 0 == sigsetjmp(asynchronous_stack_unwinding_signal_jump_buffer, 1))
        {
            stack_trace.emplace(signal_context);
--- a/src/Core/Settings.h
+++ b/src/Core/Settings.h
@ -1,5 +1,8 @@
 #pragma once

+/// CLion freezes for a minute on every keypress in any file including this.
+#if !defined(__CLION_IDE__)
+
 #include <Common/NamePrompter.h>
 #include <Core/BaseSettings.h>
 #include <Core/SettingsEnums.h>
@ -1347,3 +1350,5 @@ struct FormatFactorySettings : public BaseSettings<FormatFactorySettingsTraits>
 };

 }
+
+#endif
--- a/src/IO/tests/gtest_archive_reader_and_writer.cpp
+++ b/src/IO/tests/gtest_archive_reader_and_writer.cpp
@ -492,48 +492,6 @@ TEST_P(ArchiveReaderAndWriterTest, ManyFilesOnDisk)
    }
 }

-TEST_P(ArchiveReaderAndWriterTest, LargeFile)
-{
-    /// Make an archive.
-    std::string_view contents = "The contents of a.txt\n";
-    int times = 10000000;
-    {
-        auto writer = createArchiveWriter(getPathToArchive());
-        {
-            auto out = writer->writeFile("a.txt", times * contents.size());
-            for (int i = 0; i < times; i++)
-                writeString(contents, *out);
-            out->finalize();
-        }
-        writer->finalize();
-    }
-
-    /// Read the archive.
-    auto reader = createArchiveReader(getPathToArchive());
-
-    ASSERT_TRUE(reader->fileExists("a.txt"));
-
-    auto file_info = reader->getFileInfo("a.txt");
-    EXPECT_EQ(file_info.uncompressed_size, contents.size() * times);
-    EXPECT_GT(file_info.compressed_size, 0);
-
-    {
-        auto in = reader->readFile("a.txt", /*throw_on_not_found=*/true);
-        for (int i = 0; i < times; i++)
-            ASSERT_TRUE(checkString(String(contents), *in));
-    }
-
-    {
-        /// Use an enumerator.
-        auto enumerator = reader->firstFile();
-        ASSERT_NE(enumerator, nullptr);
-        EXPECT_EQ(enumerator->getFileName(), "a.txt");
-        EXPECT_EQ(enumerator->getFileInfo().uncompressed_size, contents.size() * times);
-        EXPECT_GT(enumerator->getFileInfo().compressed_size, 0);
-        EXPECT_FALSE(enumerator->nextFile());
-    }
-}
-
 TEST(TarArchiveReaderTest, FileExists)
 {
    String archive_path = "archive.tar";
--- a/src/Interpreters/ClusterProxy/executeQuery.cpp
+++ b/src/Interpreters/ClusterProxy/executeQuery.cpp
@ -24,7 +24,6 @@
 #include <Processors/Sources/NullSource.h>
 #include <QueryPipeline/Pipe.h>
 #include <Storages/Distributed/DistributedSettings.h>
-#include <Storages/MergeTree/ParallelReplicasReadingCoordinator.h>
 #include <Storages/SelectQueryInfo.h>
 #include <Storages/StorageReplicatedMergeTree.h>
 #include <Storages/StorageSnapshot.h>
@ -517,14 +516,11 @@ void executeQueryWithParallelReplicas(
                "`cluster_for_parallel_replicas` setting refers to cluster with several shards. Expected a cluster with one shard");
    }

-    auto coordinator = std::make_shared<ParallelReplicasReadingCoordinator>(
-        new_cluster->getShardsInfo().begin()->getAllNodeCount(), settings.parallel_replicas_mark_segment_size);
    auto external_tables = new_context->getExternalTables();
    auto read_from_remote = std::make_unique<ReadFromParallelRemoteReplicasStep>(
        query_ast,
        new_cluster,
        storage_id,
-        std::move(coordinator),
        header,
        processed_stage,
        new_context,
--- a/src/Processors/QueryPlan/ReadFromRemote.cpp
+++ b/src/Processors/QueryPlan/ReadFromRemote.cpp
@ -21,7 +21,7 @@
 #include <Client/ConnectionPoolWithFailover.h>
 #include <QueryPipeline/QueryPipelineBuilder.h>
 #include <Parsers/ASTFunction.h>
-
+#include <Storages/MergeTree/ParallelReplicasReadingCoordinator.h>
 #include <boost/algorithm/string/join.hpp>

 namespace DB
@ -362,7 +362,6 @@ ReadFromParallelRemoteReplicasStep::ReadFromParallelRemoteReplicasStep(
    ASTPtr query_ast_,
    ClusterPtr cluster_,
    const StorageID & storage_id_,
-    ParallelReplicasReadingCoordinatorPtr coordinator_,
    Block header_,
    QueryProcessingStage::Enum stage_,
    ContextMutablePtr context_,
@ -375,7 +374,6 @@ ReadFromParallelRemoteReplicasStep::ReadFromParallelRemoteReplicasStep(
    , cluster(cluster_)
    , query_ast(query_ast_)
    , storage_id(storage_id_)
-    , coordinator(std::move(coordinator_))
    , stage(std::move(stage_))
    , context(context_)
    , throttler(throttler_)
@ -438,6 +436,9 @@ void ReadFromParallelRemoteReplicasStep::initializePipeline(QueryPipelineBuilder
        shuffled_pool = shard.pool->getShuffledPools(current_settings, priority_func);
    }

+    coordinator
+        = std::make_shared<ParallelReplicasReadingCoordinator>(max_replicas_to_use, current_settings.parallel_replicas_mark_segment_size);
+
    for (size_t i=0; i < max_replicas_to_use; ++i)
    {
        IConnections::ReplicaInfo replica_info
--- a/src/Processors/QueryPlan/ReadFromRemote.h
+++ b/src/Processors/QueryPlan/ReadFromRemote.h
@ -70,7 +70,6 @@ public:
        ASTPtr query_ast_,
        ClusterPtr cluster_,
        const StorageID & storage_id_,
-        ParallelReplicasReadingCoordinatorPtr coordinator_,
        Block header_,
        QueryProcessingStage::Enum stage_,
        ContextMutablePtr context_,
--- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp
+++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp
@ -596,12 +596,12 @@ Pipe ReadFromSystemNumbersStep::makePipe()
            numbers_storage.step,
            step_between_chunks);

-        if (numbers_storage.limit && i == 0)
+        if (end && i == 0)
        {
-            auto rows_appr = itemCountInRange(numbers_storage.offset, *numbers_storage.limit, numbers_storage.step);
-            if (limit > 0 && limit < rows_appr)
-                rows_appr = query_info_limit;
-            source->addTotalRowsApprox(rows_appr);
+            UInt64 rows_approx = itemCountInRange(numbers_storage.offset, *end, numbers_storage.step);
+            if (limit > 0 && limit < rows_approx)
+                rows_approx = query_info_limit;
+            source->addTotalRowsApprox(rows_approx);
        }

        pipe.addSource(std::move(source));
--- a/tests/integration/test_parallel_replicas_no_replicas/test.py
+++ b/tests/integration/test_parallel_replicas_no_replicas/test.py
@ -33,7 +33,10 @@ def create_tables(cluster, table_name):


@pytest.mark.parametrize("skip_unavailable_shards", [1, 0])
-def test_skip_all_replicas(start_cluster, skip_unavailable_shards):
+@pytest.mark.parametrize("max_parallel_replicas", [2, 3, 100])
+def test_skip_all_replicas(
+    start_cluster, skip_unavailable_shards, max_parallel_replicas
+):
    cluster_name = "test_1_shard_3_unavaliable_replicas"
    table_name = "tt"
    create_tables(cluster_name, table_name)
@ -43,7 +46,7 @@ def test_skip_all_replicas(start_cluster, skip_unavailable_shards):
            f"SELECT key, count() FROM {table_name}  GROUP BY key ORDER BY key",
            settings={
                "allow_experimental_parallel_reading_from_replicas": 2,
-                "max_parallel_replicas": 3,
+                "max_parallel_replicas": max_parallel_replicas,
                "cluster_for_parallel_replicas": cluster_name,
                "skip_unavailable_shards": skip_unavailable_shards,
            },
--- a/tests/integration/test_storage_kerberized_hdfs/configs/hdfs.xml
+++ b/tests/integration/test_storage_kerberized_hdfs/configs/hdfs.xml
@ -1,13 +0,0 @@
-<clickhouse>
-  <hdfs>
-		<hadoop_kerberos_keytab>/tmp/keytab/clickhouse.keytab</hadoop_kerberos_keytab>
-		<hadoop_kerberos_principal>root@TEST.CLICKHOUSE.TECH</hadoop_kerberos_principal>
-		<hadoop_security_authentication>kerberos</hadoop_security_authentication>
-  </hdfs>
-  <hdfs_suser>
-		<hadoop_kerberos_principal>specuser@TEST.CLICKHOUSE.TECH</hadoop_kerberos_principal>
-  </hdfs_suser>
-  <hdfs_dedicatedcachepath>
-		<hadoop_security_kerberos_ticket_cache_path>/tmp/kerb_cache</hadoop_security_kerberos_ticket_cache_path>
-  </hdfs_dedicatedcachepath>
-</clickhouse>
--- a/tests/integration/test_storage_kerberized_hdfs/hdfs_configs/bootstrap.sh
+++ b/tests/integration/test_storage_kerberized_hdfs/hdfs_configs/bootstrap.sh
@ -1,280 +0,0 @@
-#!/bin/bash
-
-: "${HADOOP_PREFIX:=/usr/local/hadoop}"
-
-cat >> $HADOOP_PREFIX/etc/hadoop/hadoop-env.sh <<EOF
-export HADOOP_SECURE_DN_USER=hdfs
-export HADOOP_SECURE_DN_PID_DIR=$HADOOP_PREFIX/pid
-export HADOOP_SECURE_DN_LOG_DIR=$HADOOP_PREFIX/logs/hdfs
-export JSVC_HOME=$HADOOP_PREFIX/sbin
-EOF
-$HADOOP_PREFIX/etc/hadoop/hadoop-env.sh
-
-mkdir -p "${HADOOP_SECURE_DN_PID_DIR}"
-mkdir -p "${HADOOP_SECURE_DN_LOG_DIR}"
-
-rm /tmp/*.pid
-
-# installing libraries if any - (resource urls added comma separated to the ACP system variable)
-cd "${HADOOP_PREFIX}/share/hadoop/common" || exit
-for cp in ${ACP//,/ }; do  echo "== ${cp}"; curl -LO "${cp}" ; done;
-cd - || exit
-
-# altering the core-site configuration
-sed "s/HOSTNAME/${HOSTNAME}/" /usr/local/hadoop/etc/hadoop/core-site.xml.template | grep -v '/configuration' > /usr/local/hadoop/etc/hadoop/core-site.xml
-
-cat >> /usr/local/hadoop/etc/hadoop/core-site.xml << EOF
-  <property>
-    <name>hadoop.security.authentication</name>
-    <value>kerberos</value> <!-- A value of "simple" would disable security. -->
-  </property>
-   <property>
-     <name>hadoop.security.authorization</name>
-     <value>true</value>
-   </property>
-  <property>
-    <name>fs.defaultFS</name>
-    <value>hdfs://kerberizedhdfs1:9010</value>
-  </property>
-  <property>
-    <name>fs.default.name</name>
-    <value>hdfs://kerberizedhdfs1:9010</value>
-  </property>
-  <!--
-  <property>
-      <name>hadoop.rpc.protection</name>
-      <value>privacy</value>
-  </property>
-  -->
-</configuration>
-EOF
-
-
-cat > /usr/local/hadoop/etc/hadoop/hdfs-site.xml << EOF
-<configuration>
-<!--
-<property>
-	<name>dfs.permissions.enabled</name>
-	<value>false</value>
-</property>
-->
-<property>
-  <name>dfs.replication</name>
-  <value>1</value>
-</property>
-<!-- General HDFS security config -->
-<property>
-  <name>dfs.block.access.token.enable</name>
-  <value>true</value>
-</property>
-<!-- NameNode security config -->
-<property>
-  <name>dfs.namenode.keytab.file</name>
-  <value>/usr/local/hadoop/etc/hadoop/conf/hdfs.keytab</value> <!-- path to the HDFS keytab -->
-</property>
-<property>
-  <name>dfs.namenode.kerberos.principal</name>
-  <value>hdfs/_HOST@TEST.CLICKHOUSE.TECH</value>
-</property>
-<property>
-  <name>dfs.namenode.kerberos.internal.spnego.principal</name>
-  <value>HTTP/_HOST@TEST.CLICKHOUSE.TECH</value>
-</property>
-<!-- Secondary NameNode security config -->
-<property>
-  <name>dfs.secondary.namenode.keytab.file</name>
-  <value>/usr/local/hadoop/etc/hadoop/conf/hdfs.keytab</value> <!-- path to the HDFS keytab -->
-</property>
-<property>
-  <name>dfs.secondary.namenode.kerberos.principal</name>
-  <value>hdfs/_HOST@TEST.CLICKHOUSE.TECH</value>
-</property>
-<property>
-  <name>dfs.secondary.namenode.kerberos.internal.spnego.principal</name>
-  <value>HTTP/_HOST@TEST.CLICKHOUSE.TECH</value>
-</property>
-<!-- DataNode security config
-<property>
-   <name>dfs.data.transfer.protectionл</name>
-   <value>integrity</value>
-</property>
-->
-<property>
-  <name>dfs.datanode.data.dir.perm</name>
-  <value>700</value>
-</property>
-<property>
-  <name>dfs.datanode.address</name>
-  <value>0.0.0.0:1004</value>
-</property>
-<property>
-  <name>dfs.datanode.http.address</name>
-  <value>0.0.0.0:1006</value>
-</property>
-<!-- If the port is 0 then the server will start on a free port. -->
-<property>
-  <name>dfs.datanode.ipc.address</name>
-  <value>0.0.0.0:0</value>
-</property>
-<property>
-  <name>dfs.namenode.secondary.http-address</name>
-  <value>0.0.0.0:0</value>
-</property>
-<property>
-  <name>dfs.namenode.backup.address</name>
-  <value>0.0.0.0:0</value>
-</property>
-<property>
-  <name>dfs.namenode.backup.http-address</name>
-  <value>0.0.0.0:0</value>
-</property>
-<!--
-<property>
-  <name>dfs.http.policy</name>
-  <value>HTTPS_ONLY</value>
-</property>
-->
-
-
-<property>
-  <name>dfs.datanode.keytab.file</name>
-  <value>/usr/local/hadoop/etc/hadoop/conf/hdfs.keytab</value> <!-- path to the HDFS keytab -->
-</property>
-<property>
-  <name>dfs.datanode.kerberos.principal</name>
-  <value>hdfs/_HOST@TEST.CLICKHOUSE.TECH</value>
-</property>
-
-<!-- Web Authentication config -->
-<property>
-    <name>dfs.webhdfs.enabled</name>
-    <value>true</value>
-</property>
-<property>
-<name>dfs.encrypt.data.transfer</name>
-<value>false</value>
-</property>
-<property>
-  <name>dfs.web.authentication.kerberos.principal</name>
-  <value>HTTP/_HOST@TEST.CLICKHOUSE.TECH</value>
-</property>
-<property>
-    <name>dfs.web.authentication.kerberos.keytab</name>
-  <value>/usr/local/hadoop/etc/hadoop/conf/hdfs.keytab</value> <!-- path to the HDFS keytab -->
-</property>
-</configuration>
-EOF
-
-
-
-# cat > /usr/local/hadoop/etc/hadoop/ssl-server.xml << EOF
-# <configuration>
-# <property>
-#   <name>ssl.server.truststore.location</name>
-#   <value>/usr/local/hadoop/etc/hadoop/conf/hdfs.jks</value>
-# </property>
-# <property>
-#   <name>ssl.server.truststore.password</name>
-#   <value>masterkey</value>
-# </property>
-# <property>
-#   <name>ssl.server.keystore.location</name>
-#   <value>/usr/local/hadoop/etc/hadoop/conf/hdfs.jks</value>
-# </property>
-# <property>
-#   <name>ssl.server.keystore.password</name>
-#   <value>masterkey</value>
-# </property>
-# <property>
-#   <name>ssl.server.keystore.keypassword</name>
-#   <value>masterkey</value>
-# </property>
-# </configuration>
-# EOF
-
-cat > /usr/local/hadoop/etc/hadoop/log4j.properties << EOF
-# Set everything to be logged to the console
-log4j.rootCategory=DEBUG, console
-log4j.appender.console=org.apache.log4j.ConsoleAppender
-log4j.appender.console.target=System.err
-log4j.appender.console.layout=org.apache.log4j.PatternLayout
-log4j.appender.console.layout.ConversionPattern=%d{yy/MM/dd HH:mm:ss} %p %c{1}: %m%n
-
-# Set the default spark-shell log level to WARN. When running the spark-shell, the
-# log level for this class is used to overwrite the root logger's log level, so that
-# the user can have different defaults for the shell and regular Spark apps.
-log4j.logger.org.apache.spark.repl.Main=INFO
-
-# Settings to quiet third party logs that are too verbose
-log4j.logger.org.spark_project.jetty=DEBUG
-log4j.logger.org.spark_project.jetty.util.component.AbstractLifeCycle=ERROR
-log4j.logger.org.apache.spark.repl.SparkIMain$exprTyper=INFO
-log4j.logger.org.apache.spark.repl.SparkILoop$SparkILoopInterpreter=INFO
-log4j.logger.org.apache.parquet=ERROR
-log4j.logger.parquet=ERROR
-
-# SPARK-9183: Settings to avoid annoying messages when looking up nonexistent UDFs in SparkSQL with Hive support
-log4j.logger.org.apache.hadoop.hive.metastore.RetryingHMSHandler=FATAL
-log4j.logger.org.apache.hadoop.hive.ql.exec.FunctionRegistry=ERROR
-
-log4j.logger.org.apache.spark.deploy=DEBUG
-log4j.logger.org.apache.spark.executor=DEBUG
-log4j.logger.org.apache.spark.scheduler=DEBUG
-EOF
-
-useradd -u 1098 hdfs
-
-# keytool -genkey -alias kerberized_hdfs1.test.clickhouse.com -keyalg rsa -keysize 1024 -dname "CN=kerberized_hdfs1.test.clickhouse.com" -keypass masterkey -keystore /usr/local/hadoop/etc/hadoop/conf/hdfs.jks -storepass masterkey
-keytool -genkey -alias kerberizedhdfs1 -keyalg rsa -keysize 1024 -dname "CN=kerberizedhdfs1" -keypass masterkey -keystore /usr/local/hadoop/etc/hadoop/conf/hdfs.jks -storepass masterkey
-
-chmod g+r /usr/local/hadoop/etc/hadoop/conf/hdfs.jks
-
-
-service sshd start
-
-# yum --quiet --assumeyes install krb5-workstation.x86_64
-# yum --quiet --assumeyes install tcpdump
-
-# cd /tmp
-# curl http://archive.apache.org/dist/commons/daemon/source/commons-daemon-1.0.15-src.tar.gz   -o  commons-daemon-1.0.15-src.tar.gz
-# tar xzf commons-daemon-1.0.15-src.tar.gz
-# cd commons-daemon-1.0.15-src/src/native/unix
-# ./configure && make
-# cp ./jsvc /usr/local/hadoop/sbin
-
-
-until kinit -kt /usr/local/hadoop/etc/hadoop/conf/hdfs.keytab hdfs/kerberizedhdfs1@TEST.CLICKHOUSE.TECH; do sleep 2; done
-echo "KDC is up and ready to go... starting up"
-
-$HADOOP_PREFIX/sbin/start-dfs.sh
-$HADOOP_PREFIX/sbin/start-yarn.sh
-$HADOOP_PREFIX/sbin/mr-jobhistory-daemon.sh start historyserver
-
-chmod a+r /usr/local/hadoop/etc/hadoop/conf/hdfs.keytab   # create dedicated keytab for hdfsuser
-
-$HADOOP_PREFIX/sbin/start-secure-dns.sh
-sleep 3
-
-/usr/local/hadoop/bin/hdfs dfsadmin -safemode leave
-
-/usr/local/hadoop/bin/hdfs dfs -mkdir /user/specuser
-/usr/local/hadoop/bin/hdfs dfs -chown specuser /user/specuser
-echo "chown_completed" | /usr/local/hadoop/bin/hdfs dfs -appendToFile - /preparations_done_marker
-
-kdestroy
-
-
-
-# adduser --groups hdfs hdfsuser
-
-# /usr/local/hadoop/sbin/hadoop-daemon.sh --config /usr/local/hadoop/etc/hadoop/ --script /usr/local/hadoop/sbin/hdfs start namenode
-# /usr/local/hadoop/sbin/hadoop-daemon.sh --config /usr/local/hadoop/etc/hadoop/ --script /usr/local/hadoop/sbin/hdfs start datanode
-
-
-if [[ $1 == "-d" ]]; then
-  while true; do sleep 1000; done
-fi
-
-if [[ $1 == "-bash" ]]; then
-  /bin/bash
-fi
--- a/tests/integration/test_storage_kerberized_hdfs/kerberos_image_config.sh
+++ b/tests/integration/test_storage_kerberized_hdfs/kerberos_image_config.sh
@ -1,140 +0,0 @@
-#!/bin/bash
-
-
-set -x  #  trace
-
-: "${REALM:=TEST.CLICKHOUSE.TECH}"
-: "${DOMAIN_REALM:=test.clickhouse.com}"
-: "${KERB_MASTER_KEY:=masterkey}"
-: "${KERB_ADMIN_USER:=admin}"
-: "${KERB_ADMIN_PASS:=admin}"
-
-create_config() {
-  : "${KDC_ADDRESS:=$(hostname -f)}"
-
-  cat>/etc/krb5.conf<<EOF
-[logging]
- default = FILE:/var/log/kerberos/krb5libs.log
- kdc = FILE:/var/log/kerberos/krb5kdc.log
- admin_server = FILE:/var/log/kerberos/kadmind.log
-
-[libdefaults]
- default_realm = $REALM
- dns_lookup_realm = false
- dns_lookup_kdc = false
- ticket_lifetime = 15d
- renew_lifetime = 15d
- forwardable = true
- # WARNING: We use weaker key types to simplify testing as stronger key types
- # require the enhanced security JCE policy file to be installed. You should
- # NOT run with this configuration in production or any real environment. You
- # have been warned.
- default_tkt_enctypes = des-cbc-md5 des-cbc-crc des3-cbc-sha1
- default_tgs_enctypes = des-cbc-md5 des-cbc-crc des3-cbc-sha1
- permitted_enctypes = des-cbc-md5 des-cbc-crc des3-cbc-sha1
-
-[realms]
- $REALM = {
-  kdc = $KDC_ADDRESS
-  admin_server = $KDC_ADDRESS
- }
-
-[domain_realm]
- .$DOMAIN_REALM = $REALM
- $DOMAIN_REALM = $REALM
-EOF
-
-cat>/var/kerberos/krb5kdc/kdc.conf<<EOF
-[kdcdefaults]
- kdc_ports = 88
- kdc_tcp_ports = 88
-
-[realms]
- $REALM = {
-  acl_file = /var/kerberos/krb5kdc/kadm5.acl
-  dict_file = /usr/share/dict/words
-  admin_keytab = /var/kerberos/krb5kdc/kadm5.keytab
-  # WARNING: We use weaker key types to simplify testing as stronger key types
-  # require the enhanced security JCE policy file to be installed. You should
-  # NOT run with this configuration in production or any real environment. You
-  # have been warned.
-  master_key_type = des3-hmac-sha1
-  supported_enctypes = arcfour-hmac:normal des3-hmac-sha1:normal des-cbc-crc:normal des:normal des:v4 des:norealm des:onlyrealm des:afs3
-  default_principal_flags = +preauth
- }
-EOF
-}
-
-create_db() {
-  /usr/sbin/kdb5_util -P $KERB_MASTER_KEY -r $REALM create -s
-}
-
-start_kdc() {
-  mkdir -p /var/log/kerberos
-
-  /etc/rc.d/init.d/krb5kdc start
-  /etc/rc.d/init.d/kadmin start
-
-  chkconfig krb5kdc on
-  chkconfig kadmin on
-}
-
-restart_kdc() {
-  /etc/rc.d/init.d/krb5kdc restart
-  /etc/rc.d/init.d/kadmin restart
-}
-
-create_admin_user() {
-  kadmin.local -q "addprinc -pw $KERB_ADMIN_PASS $KERB_ADMIN_USER/admin"
-  echo "*/admin@$REALM *" > /var/kerberos/krb5kdc/kadm5.acl
-}
-
-create_keytabs() {
-  rm /tmp/keytab/*.keytab
-
-
-  # kadmin.local -q "addprinc -randkey hdfs/kerberizedhdfs1.${DOMAIN_REALM}@${REALM}"
-  # kadmin.local -q "ktadd -norandkey -k /tmp/keytab/hdfs.keytab hdfs/kerberizedhdfs1.${DOMAIN_REALM}@${REALM}"
-
-  # kadmin.local -q "addprinc -randkey HTTP/kerberizedhdfs1.${DOMAIN_REALM}@${REALM}"
-  # kadmin.local -q "ktadd -norandkey -k /tmp/keytab/hdfs.keytab HTTP/kerberizedhdfs1.${DOMAIN_REALM}@${REALM}"
-  kadmin.local -q "addprinc -randkey hdfs/kerberizedhdfs1@${REALM}"
-  kadmin.local -q "ktadd -norandkey -k /tmp/keytab/hdfs.keytab hdfs/kerberizedhdfs1@${REALM}"
-
-  kadmin.local -q "addprinc -randkey HTTP/kerberizedhdfs1@${REALM}"
-  kadmin.local -q "ktadd -norandkey -k /tmp/keytab/hdfs.keytab HTTP/kerberizedhdfs1@${REALM}"
-
-  kadmin.local -q "addprinc -randkey hdfsuser/node1@${REALM}"
-  kadmin.local -q "ktadd -norandkey -k /tmp/keytab/clickhouse.keytab hdfsuser/node1@${REALM}"
-  kadmin.local -q "addprinc -randkey hdfsuser@${REALM}"
-  kadmin.local -q "ktadd -norandkey -k /tmp/keytab/clickhouse.keytab hdfsuser@${REALM}"
-  kadmin.local -q "addprinc -randkey root@${REALM}"
-  kadmin.local -q "ktadd -norandkey -k /tmp/keytab/clickhouse.keytab root@${REALM}"
-  kadmin.local -q "addprinc -randkey specuser@${REALM}"
-  kadmin.local -q "ktadd -norandkey -k /tmp/keytab/clickhouse.keytab specuser@${REALM}"
-
-  chmod g+r /tmp/keytab/clickhouse.keytab
-}
-
-main() {
-
-  if [ ! -f /kerberos_initialized ]; then
-    create_config
-    create_db
-    create_admin_user
-    start_kdc
-
-    touch /kerberos_initialized
-  fi
-
-  if [ ! -f /var/kerberos/krb5kdc/principal ]; then
-    while true; do sleep 1000; done
-  else
-    start_kdc
-		create_keytabs
-    tail -F /var/log/kerberos/krb5kdc.log
-  fi
-
-}
-
-[[ "$0" == "${BASH_SOURCE[0]}" ]] && main "$@"
--- a/tests/integration/test_storage_kerberized_hdfs/secrets/krb.conf
+++ b/tests/integration/test_storage_kerberized_hdfs/secrets/krb.conf
@ -1,25 +0,0 @@
-[logging]
- default = FILE:/var/log/krb5libs.log
- kdc = FILE:/var/log/krb5kdc.log
- admin_server = FILE:/var/log/kadmind.log
-
-[libdefaults]
- default_realm = TEST.CLICKHOUSE.TECH
- dns_lookup_realm = false
- dns_lookup_kdc = false
- ticket_lifetime = 5s
- forwardable = true
- rdns = false
- default_tgs_enctypes = des3-hmac-sha1
- default_tkt_enctypes = des3-hmac-sha1
- permitted_enctypes = des3-hmac-sha1
-
-[realms]
- TEST.CLICKHOUSE.TECH = {
-  kdc = hdfskerberos
-  admin_server = hdfskerberos
- }
-
-[domain_realm]
- .test.clickhouse.com = TEST.CLICKHOUSE.TECH
- test.clickhouse.com = TEST.CLICKHOUSE.TECH
--- a/tests/integration/test_storage_kerberized_hdfs/secrets/krb_long.conf
+++ b/tests/integration/test_storage_kerberized_hdfs/secrets/krb_long.conf
@ -1,24 +0,0 @@
-[logging]
- default = FILE:/var/log/krb5libs.log
- kdc = FILE:/var/log/krb5kdc.log
- admin_server = FILE:/var/log/kadmind.log
-
-[libdefaults]
- default_realm = TEST.CLICKHOUSE.TECH
- dns_lookup_realm = false
- dns_lookup_kdc = false
- ticket_lifetime = 15d
- forwardable = true
- default_tgs_enctypes = des3-hmac-sha1
- default_tkt_enctypes = des3-hmac-sha1
- permitted_enctypes = des3-hmac-sha1
-
-[realms]
- TEST.CLICKHOUSE.TECH = {
-  kdc = hdfskerberos
-  admin_server = hdfskerberos
- }
-
-[domain_realm]
- .test.clickhouse.com = TEST.CLICKHOUSE.TECH
- test.clickhouse.com = TEST.CLICKHOUSE.TECH
--- a/tests/integration/test_storage_kerberized_hdfs/test.py
+++ b/tests/integration/test_storage_kerberized_hdfs/test.py
@ -1,155 +0,0 @@
-import time
-import pytest
-
-import os
-
-from helpers.cluster import ClickHouseCluster, is_arm
-import subprocess
-
-if is_arm():
-    pytestmark = pytest.mark.skip
-
-cluster = ClickHouseCluster(__file__)
-node1 = cluster.add_instance(
-    "node1",
-    with_kerberized_hdfs=True,
-    user_configs=[],
-    main_configs=["configs/hdfs.xml"],
-)
-
-
-@pytest.fixture(scope="module")
-def started_cluster():
-    try:
-        cluster.start()
-
-        yield cluster
-
-    except Exception as ex:
-        print(ex)
-        raise ex
-    finally:
-        cluster.shutdown()
-
-
-def test_read_table(started_cluster):
-    hdfs_api = started_cluster.hdfs_api
-
-    data = "1\tSerialize\t555.222\n2\tData\t777.333\n"
-    hdfs_api.write_data("/simple_table_function", data)
-
-    api_read = hdfs_api.read_data("/simple_table_function")
-    assert api_read == data
-
-    select_read = node1.query(
-        "select * from hdfs('hdfs://kerberizedhdfs1:9010/simple_table_function', 'TSV', 'id UInt64, text String, number Float64')"
-    )
-    assert select_read == data
-
-
-def test_read_write_storage(started_cluster):
-    hdfs_api = started_cluster.hdfs_api
-
-    node1.query(
-        "create table SimpleHDFSStorage2 (id UInt32, name String, weight Float64) ENGINE = HDFS('hdfs://kerberizedhdfs1:9010/simple_storage1', 'TSV')"
-    )
-    node1.query("insert into SimpleHDFSStorage2 values (1, 'Mark', 72.53)")
-
-    api_read = hdfs_api.read_data("/simple_storage1")
-    assert api_read == "1\tMark\t72.53\n"
-
-    select_read = node1.query("select * from SimpleHDFSStorage2")
-    assert select_read == "1\tMark\t72.53\n"
-
-
-def test_write_storage_not_expired(started_cluster):
-    hdfs_api = started_cluster.hdfs_api
-
-    node1.query(
-        "create table SimpleHDFSStorageNotExpired (id UInt32, name String, weight Float64) ENGINE = HDFS('hdfs://kerberizedhdfs1:9010/simple_storage_not_expired', 'TSV')"
-    )
-
-    time.sleep(15)  # wait for ticket expiration
-    node1.query("insert into SimpleHDFSStorageNotExpired values (1, 'Mark', 72.53)")
-
-    api_read = hdfs_api.read_data("/simple_storage_not_expired")
-    assert api_read == "1\tMark\t72.53\n"
-
-    select_read = node1.query("select * from SimpleHDFSStorageNotExpired")
-    assert select_read == "1\tMark\t72.53\n"
-
-
-def test_two_users(started_cluster):
-    hdfs_api = started_cluster.hdfs_api
-
-    node1.query(
-        "create table HDFSStorOne (id UInt32, name String, weight Float64) ENGINE = HDFS('hdfs://kerberizedhdfs1:9010/storage_user_one', 'TSV')"
-    )
-    node1.query("insert into HDFSStorOne values (1, 'Real', 86.00)")
-
-    node1.query(
-        "create table HDFSStorTwo (id UInt32, name String, weight Float64) ENGINE = HDFS('hdfs://suser@kerberizedhdfs1:9010/user/specuser/storage_user_two', 'TSV')"
-    )
-    node1.query("insert into HDFSStorTwo values (1, 'Ideal', 74.00)")
-
-    select_read_1 = node1.query(
-        "select * from hdfs('hdfs://kerberizedhdfs1:9010/user/specuser/storage_user_two', 'TSV', 'id UInt64, text String, number Float64')"
-    )
-
-    select_read_2 = node1.query(
-        "select * from hdfs('hdfs://suser@kerberizedhdfs1:9010/storage_user_one', 'TSV', 'id UInt64, text String, number Float64')"
-    )
-
-
-def test_read_table_expired(started_cluster):
-    hdfs_api = started_cluster.hdfs_api
-
-    data = "1\tSerialize\t555.222\n2\tData\t777.333\n"
-    hdfs_api.write_data("/simple_table_function_relogin", data)
-
-    started_cluster.pause_container("hdfskerberos")
-    time.sleep(15)
-
-    try:
-        select_read = node1.query(
-            "select * from hdfs('hdfs://reloginuser&kerberizedhdfs1:9010/simple_table_function', 'TSV', 'id UInt64, text String, number Float64')"
-        )
-        assert False, "Exception have to be thrown"
-    except Exception as ex:
-        assert "DB::Exception: KerberosInit failure:" in str(ex)
-
-    started_cluster.unpause_container("hdfskerberos")
-
-
-def test_prohibited(started_cluster):
-    node1.query(
-        "create table HDFSStorTwoProhibited (id UInt32, name String, weight Float64) ENGINE = HDFS('hdfs://suser@kerberizedhdfs1:9010/storage_user_two_prohibited', 'TSV')"
-    )
-    try:
-        node1.query("insert into HDFSStorTwoProhibited values (1, 'SomeOne', 74.00)")
-        assert False, "Exception have to be thrown"
-    except Exception as ex:
-        assert (
-            "Unable to open HDFS file: /storage_user_two_prohibited (hdfs://suser@kerberizedhdfs1:9010/storage_user_two_prohibited) error: Permission denied: user=specuser, access=WRITE"
-            in str(ex)
-        )
-
-
-def test_cache_path(started_cluster):
-    node1.query(
-        "create table HDFSStorCachePath (id UInt32, name String, weight Float64) ENGINE = HDFS('hdfs://dedicatedcachepath@kerberizedhdfs1:9010/storage_dedicated_cache_path', 'TSV')"
-    )
-    try:
-        node1.query("insert into HDFSStorCachePath values (1, 'FatMark', 92.53)")
-        assert False, "Exception have to be thrown"
-    except Exception as ex:
-        assert (
-            "DB::Exception: hadoop.security.kerberos.ticket.cache.path cannot be set per user"
-            in str(ex)
-        )
-
-
-if __name__ == "__main__":
-    cluster.start()
-    input("Cluster created, press any key to destroy...")
-    cluster.shutdown()
--- a/tests/performance/decimal_aggregates.xml
+++ b/tests/performance/decimal_aggregates.xml
@ -4,8 +4,13 @@
    </settings>

    <create_query>CREATE TABLE t (x UInt64, d32 Decimal32(3), d64 Decimal64(4), d128 Decimal128(5)) ENGINE = Memory</create_query>
-    <!-- use less threads to save memory -->
-    <fill_query>INSERT INTO t SELECT number AS x, x % 1000000 AS d32, x AS d64, x d128 FROM numbers_mt(500000000) SETTINGS max_threads = 8</fill_query>
+    <!-- use less threads and several queries to save memory -->
+    <fill_query>INSERT INTO t SELECT number AS x, x % 1000000 AS d32, x AS d64, x d128 FROM numbers_mt(100000000) SETTINGS max_threads = 2</fill_query>
+    <fill_query>INSERT INTO t SELECT number AS x, x % 1000000 AS d32, x AS d64, x d128 FROM numbers_mt(100000000, 100000000) SETTINGS max_threads = 2</fill_query>
+    <fill_query>INSERT INTO t SELECT number AS x, x % 1000000 AS d32, x AS d64, x d128 FROM numbers_mt(200000000, 100000000) SETTINGS max_threads = 2</fill_query>
+    <fill_query>INSERT INTO t SELECT number AS x, x % 1000000 AS d32, x AS d64, x d128 FROM numbers_mt(300000000, 100000000) SETTINGS max_threads = 2</fill_query>
+    <fill_query>INSERT INTO t SELECT number AS x, x % 1000000 AS d32, x AS d64, x d128 FROM numbers_mt(400000000, 100000000) SETTINGS max_threads = 2</fill_query>
+
    <drop_query>DROP TABLE IF EXISTS t</drop_query>

    <query>SELECT min(d32), max(d32), argMin(x, d32), argMax(x, d32) FROM t</query>
--- a/tests/queries/0_stateless/01042_system_reload_dictionary_reloads_completely.reference
+++ b/tests/queries/0_stateless/01042_system_reload_dictionary_reloads_completely.reference
@ -1,6 +1,6 @@
 12 -> 	102
 13 -> 	103
 14 -> 	-1
-12(r) -> 	102
-13(r) -> 	103
-14(r) -> 	104
+12 (after reloading) -> 	102
+13 (after reloading) -> 	103
+14 (after reloading) -> 	104
--- a/tests/queries/0_stateless/01042_system_reload_dictionary_reloads_completely.sh
+++ b/tests/queries/0_stateless/01042_system_reload_dictionary_reloads_completely.sh
@ -1,4 +1,6 @@
 #!/usr/bin/env bash
+# Tags: no-random-settings
+# Dictionaries are updated using the server time.

 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
 # shellcheck source=../shell_config.sh
@ -6,8 +8,7 @@ CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)

 set -e -o pipefail

-# NOTE: dictionaries TTLs works with server timezone, so session_timeout cannot be used
-$CLICKHOUSE_CLIENT --session_timezone '' --multiquery <<EOF
+$CLICKHOUSE_CLIENT --multiquery <<EOF
 CREATE TABLE ${CLICKHOUSE_DATABASE}.table(x Int64, y Int64, insert_time DateTime) ENGINE = MergeTree ORDER BY tuple();
 INSERT INTO ${CLICKHOUSE_DATABASE}.table VALUES (12, 102, now());

@ -28,16 +29,21 @@ $CLICKHOUSE_CLIENT --query "SELECT '12 -> ', dictGetInt64('${CLICKHOUSE_DATABASE
 $CLICKHOUSE_CLIENT --query "INSERT INTO ${CLICKHOUSE_DATABASE}.table VALUES (13, 103, now())"
 $CLICKHOUSE_CLIENT --query "INSERT INTO ${CLICKHOUSE_DATABASE}.table VALUES (14, 104, now() - INTERVAL 1 DAY)"

+# Wait when the dictionary will update the value for 13 on its own:
 while [ "$(${CLICKHOUSE_CLIENT} --query "SELECT dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(13))")" = -1 ]
-    do
-        sleep 0.5
-    done
+do
+    sleep 0.5
+done

 $CLICKHOUSE_CLIENT --query "SELECT '13 -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(13))"
+
+# By the way, the value for 14 is expected to not be updated at this moment,
+# because the values were selected by the update field insert_time, and for 14 it was set as one day ago.
 $CLICKHOUSE_CLIENT --query "SELECT '14 -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(14))"

+# SYSTEM RELOAD DICTIONARY reloads it completely, regardless of the update field, so we will see new values, even for key 14.
 $CLICKHOUSE_CLIENT --query "SYSTEM RELOAD DICTIONARY '${CLICKHOUSE_DATABASE}.dict'"

-$CLICKHOUSE_CLIENT --query "SELECT '12(r) -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(12))"
-$CLICKHOUSE_CLIENT --query "SELECT '13(r) -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(13))"
-$CLICKHOUSE_CLIENT --query "SELECT '14(r) -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(14))"
+$CLICKHOUSE_CLIENT --query "SELECT '12 (after reloading) -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(12))"
+$CLICKHOUSE_CLIENT --query "SELECT '13 (after reloading) -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(13))"
+$CLICKHOUSE_CLIENT --query "SELECT '14 (after reloading) -> ', dictGetInt64('${CLICKHOUSE_DATABASE}.dict', 'y', toUInt64(14))"
--- a/tests/queries/0_stateless/02481_async_insert_race_long.sh
+++ b/tests/queries/0_stateless/02481_async_insert_race_long.sh
@ -13,7 +13,7 @@ function insert1()
 {
    local TIMELIMIT=$((SECONDS+$1))
    while [ $SECONDS -lt "$TIMELIMIT" ]; do
-        ${MY_CLICKHOUSE_CLIENT} --wait_for_async_insert 0 -q 'INSERT INTO async_inserts_race FORMAT CSV 1,"a"'
+        ${MY_CLICKHOUSE_CLIENT} --insert_keeper_fault_injection_probability=0 --wait_for_async_insert 0 -q 'INSERT INTO async_inserts_race FORMAT CSV 1,"a"'
    done
 }

@ -21,7 +21,7 @@ function insert2()
 {
    local TIMELIMIT=$((SECONDS+$1))
    while [ $SECONDS -lt "$TIMELIMIT" ]; do
-        ${MY_CLICKHOUSE_CLIENT} --wait_for_async_insert 0 -q 'INSERT INTO async_inserts_race FORMAT JSONEachRow {"id": 5, "s": "e"} {"id": 6, "s": "f"}'
+        ${MY_CLICKHOUSE_CLIENT} --insert_keeper_fault_injection_probability=0 --wait_for_async_insert 0 -q 'INSERT INTO async_inserts_race FORMAT JSONEachRow {"id": 5, "s": "e"} {"id": 6, "s": "f"}'
    done
 }

@ -29,7 +29,7 @@ function insert3()
 {
    local TIMELIMIT=$((SECONDS+$1))
    while [ $SECONDS -lt "$TIMELIMIT" ]; do
-        ${MY_CLICKHOUSE_CLIENT} --wait_for_async_insert 1 -q "INSERT INTO async_inserts_race VALUES (7, 'g') (8, 'h')" &
+        ${MY_CLICKHOUSE_CLIENT} --insert_keeper_fault_injection_probability=0 --wait_for_async_insert 1 -q "INSERT INTO async_inserts_race VALUES (7, 'g') (8, 'h')" &
        sleep 0.05
    done

--- a/tests/queries/0_stateless/03205_parallel_replicas_alter_select_ubsan.reference
+++ b/tests/queries/0_stateless/03205_parallel_replicas_alter_select_ubsan.reference
--- a/tests/queries/0_stateless/03205_parallel_replicas_alter_select_ubsan.sql
+++ b/tests/queries/0_stateless/03205_parallel_replicas_alter_select_ubsan.sql
@ -0,0 +1,35 @@
+SET alter_sync = 2;
+SET max_parallel_replicas = 3, cluster_for_parallel_replicas = 'test_cluster_one_shard_three_replicas_localhost', parallel_replicas_for_non_replicated_merge_tree = true;
+
+DROP TABLE IF EXISTS t1;
+DROP TABLE IF EXISTS t1__fuzz_26;
+
+CREATE TABLE t1__fuzz_26 (`a` Nullable(Float64), `b` Nullable(Float32), `pk` Int64) ENGINE = MergeTree ORDER BY pk;
+CREATE TABLE t1 ( a Float64, b Int64, pk String) Engine = MergeTree() ORDER BY pk;
+
+ALTER TABLE t1
+    (MODIFY COLUMN `a` Float64 TTL toDateTime(b) + toIntervalMonth(viewExplain('EXPLAIN', 'actions = 1', (
+        SELECT
+            toIntervalMonth(1),
+            2
+        FROM t1__fuzz_26
+        GROUP BY
+            toFixedString('%Prewhere%', 10),
+            toNullable(12)
+            WITH ROLLUP
+    )), 1)) settings allow_experimental_parallel_reading_from_replicas = 1; -- { serverError INCORRECT_RESULT_OF_SCALAR_SUBQUERY }
+
+ALTER TABLE t1
+    (MODIFY COLUMN `a` Float64 TTL toDateTime(b) + toIntervalMonth(viewExplain('EXPLAIN', 'actions = 1', (
+        SELECT
+            toIntervalMonth(1),
+            2
+        FROM t1__fuzz_26
+        GROUP BY
+            toFixedString('%Prewhere%', 10),
+            toNullable(12)
+            WITH ROLLUP
+    )), 1)) settings allow_experimental_parallel_reading_from_replicas = 0; -- { serverError INCORRECT_RESULT_OF_SCALAR_SUBQUERY }
+
+DROP TABLE t1;
+DROP TABLE t1__fuzz_26;
--- a/tests/queries/0_stateless/03208_numbers_total_rows_approx.reference
+++ b/tests/queries/0_stateless/03208_numbers_total_rows_approx.reference
@ -0,0 +1 @@
+2
--- a/tests/queries/0_stateless/03208_numbers_total_rows_approx.sql
+++ b/tests/queries/0_stateless/03208_numbers_total_rows_approx.sql
@ -0,0 +1 @@
+SELECT number FROM numbers(2, 1) WHERE number % 2 = 0 SETTINGS max_rows_to_read = 10;
				`@ -0,0 +1 @@`
				`SELECT number FROM numbers(2, 1) WHERE number % 2 = 0 SETTINGS max_rows_to_read = 10;`